framework,version,device,op_name,kernel_source,moe_dtype,num_tokens,hidden_size,inter_size,topk,num_experts,moe_tp_size,moe_ep_size,distribution,latency
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,1,balanced,0.19606933991114298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,1,balanced,0.11915199955304463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,1,power_law_1.2,0.1176192045211792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,1,power_law_1.01,0.11767040491104126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,1,power_law_1.2,0.1892351984977722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,1,power_law_1.01,0.18926719427108765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,1,balanced,0.19572800397872925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,1,balanced,0.3519573211669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,1,power_law_1.01,0.16535040140151977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,1,power_law_1.2,0.16494079828262329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,1,power_law_1.01,0.28872320652008054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,1,balanced,0.35425599416097003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,1,balanced,0.6599253416061401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,1,power_law_1.2,0.2734976053237915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,1,power_law_1.01,0.2234368085861206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,1,balanced,0.11537599563598633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,1,power_law_1.2,0.17238399982452393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,1,power_law_1.01,0.1152448058128357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,1,power_law_1.01,0.3844095945358276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,1,power_law_1.2,0.30471038818359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,1,balanced,0.358570655186971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,1,balanced,0.6659733454386393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,1,power_law_1.01,0.3520319938659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,1,power_law_1.2,0.361023998260498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,1,power_law_1.2,0.6300672054290771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,1,balanced,0.1948266625404358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,1,power_law_1.01,0.14023040533065795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,1,power_law_1.01,0.6462656021118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,1,balanced,0.36480534076690674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,1,power_law_1.01,0.3444607973098755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,1,power_law_1.2,0.633951997756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,1,balanced,0.6694026788075765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,1,power_law_1.2,0.3598912000656128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,1,balanced,0.35759464899698895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,1,power_law_1.01,0.2374720096588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,1,power_law_1.2,0.674399995803833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,1,balanced,0.363264004389445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,1,power_law_1.01,0.6532864093780517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,1,power_law_1.01,0.36855039596557615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,1,power_law_1.2,0.3732991933822632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,1,balanced,0.6694773038228353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,1,power_law_1.2,0.6819263935089112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,1,power_law_1.01,0.33013761043548584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,1,balanced,0.3617973327636719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,1,balanced,0.36856532096862793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,1,power_law_1.01,0.39959039688110354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,1,power_law_1.01,0.6760767936706543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,1,power_law_1.2,0.7126272201538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,1,power_law_1.2,0.3942847967147827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,1,balanced,0.6764480272928873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,1,power_law_1.01,0.3621952056884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,1,balanced,0.3639093240102132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,1,power_law_1.2,0.7081855773925781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,1,balanced,0.37379201253255206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,1,power_law_1.01,0.39310081005096437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,1,power_law_1.01,0.6898176193237304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,1,power_law_1.2,0.3951551914215088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,1,power_law_1.2,0.7458303928375244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,1,balanced,0.6775946617126465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,1,power_law_1.01,0.3823807954788208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,1,balanced,0.368341326713562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,1,power_law_1.01,0.405017614364624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,1,balanced,0.37781866391499835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,1,power_law_1.2,0.8106368064880372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,1,power_law_1.01,0.7146111965179444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,1,power_law_1.2,0.4020864009857178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,1,balanced,0.7023306687672933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,1,balanced,0.3720533450444539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,1,power_law_1.2,0.8670207977294921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,1,power_law_1.01,0.4351039886474609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,1,power_law_1.01,0.40704002380371096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,1,balanced,0.3766719897588094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,1,power_law_1.2,0.9628288269042968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,1,power_law_1.2,0.40577921867370603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,1,power_law_1.01,0.7265471935272216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,1,power_law_1.01,0.4209472179412842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,1,balanced,0.704469362894694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,1,balanced,0.37778135140736896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,1,power_law_1.01,0.4727935791015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,1,balanced,0.3896266619364421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,1,power_law_1.2,0.9015551567077636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,1,power_law_1.01,0.7355008125305176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,1,power_law_1.2,0.4261439800262451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,1,power_law_1.01,0.44537601470947263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,1,power_law_1.2,0.9820032119750977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,1,balanced,0.7238132953643799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,1,balanced,0.3911840120951335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,1,power_law_1.2,0.9711296081542968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,1,power_law_1.01,0.44537601470947263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,1,power_law_1.01,0.8261631965637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,1,power_law_1.2,0.4389632225036621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,1,balanced,0.3947360118230184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,1,balanced,0.7217493057250977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,1,power_law_1.2,1.1141568183898927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,1,power_law_1.01,0.503545618057251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,1,power_law_1.2,0.4622975826263428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,1,power_law_1.01,0.8294591903686523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,1,power_law_1.2,1.311788845062256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,1,balanced,0.4169866641362508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,1,balanced,0.7229173183441162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,1,power_law_1.01,0.5213568210601807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,1,power_law_1.2,1.4202943801879884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,1,power_law_1.2,0.5043583869934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,1,power_law_1.01,0.8616831779479981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,1,balanced,0.3819040060043335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,1,power_law_1.01,0.42435197830200194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,1,balanced,0.42987199624379474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,1,power_law_1.2,1.7969856262207031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,1,balanced,0.7796640396118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,1,power_law_1.01,0.5371071815490722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,1,power_law_1.2,0.5161983966827393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,1,power_law_1.2,2.2307519912719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,1,balanced,0.38762664794921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,1,power_law_1.01,0.9249343872070312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,1,power_law_1.01,0.47416319847106936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,1,balanced,0.43460798263549805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,1,balanced,0.7776052951812744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,1,power_law_1.01,0.6271679878234864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,1,power_law_1.2,3.0833856582641603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,1,power_law_1.2,0.5414400100708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,1,power_law_1.01,0.9405183792114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,1,balanced,0.7812960147857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,1,balanced,0.48262401421864826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,1,power_law_1.01,0.6795008182525635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,1,power_law_1.2,3.908243179321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,1,power_law_1.2,0.6271743774414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,1,power_law_1.01,0.9749055862426758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,1,balanced,0.8705920378367106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,1,power_law_1.01,0.7811327934265136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,1,balanced,0.6015573342641195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,1,power_law_1.2,5.823820877075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,1,power_law_1.2,0.702617597579956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,1,power_law_1.01,1.1552639961242677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,1,power_law_1.01,1.006284809112549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,1,balanced,0.9940746625264486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,1,balanced,0.6201440095901489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,1,power_law_1.2,7.794156646728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,1,power_law_1.01,1.2709055900573731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,1,power_law_1.2,0.7712575912475585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,1,power_law_1.01,1.2920063972473144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,1,balanced,1.013594627380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,1,balanced,0.842741330464681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,1,power_law_1.2,11.625682830810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,1,power_law_1.2,1.0101183891296386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,1,power_law_1.01,1.7617279052734376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,1,power_law_1.01,1.3604864120483398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,1,balanced,1.403216044108073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,1,balanced,1.0668213367462158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,1,balanced,0.40447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,1,power_law_1.01,0.43494400978088377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,1,power_law_1.2,15.08922882080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,1,power_law_1.2,1.2790656089782715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,1,power_law_1.01,2.2449663162231444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,1,power_law_1.01,1.7892864227294922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,1,balanced,0.41418667634328205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,1,balanced,1.8056532541910808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,1,balanced,1.549338658650716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,1,power_law_1.01,0.4770751953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,1,power_law_1.2,1.7319679260253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,1,power_law_1.01,3.2165374755859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,1,power_law_1.2,18.785005187988283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,1,power_law_1.01,2.2416576385498046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,1,balanced,0.4211146831512451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,1,power_law_1.01,0.4804096221923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,1,balanced,2.6243786811828613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,1,power_law_1.2,2.2112064361572266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,1,power_law_1.01,4.138809585571289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,1,balanced,2.0416107177734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,1,power_law_1.01,3.0879039764404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,1,balanced,0.4364480177561442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,1,power_law_1.01,0.5465216159820556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,1,power_law_1.2,3.1765056610107423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,1,power_law_1.01,6.189459228515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,1,balanced,0.4867039918899536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,1,balanced,3.479215939839681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,1,power_law_1.2,29.946688842773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,1,power_law_1.01,3.87562255859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,1,balanced,3.022320111592611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,1,power_law_1.01,0.548851203918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,1,balanced,0.5073066552480062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,1,power_law_1.2,4.299916839599609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,1,power_law_1.01,8.563340759277343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,1,power_law_1.01,0.5901055812835694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,1,power_law_1.01,5.782912063598633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,1,balanced,5.331173261006673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,1,balanced,0.5384053389231364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,1,balanced,3.9949334462483725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,1,power_law_1.01,0.6911295890808106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,1,power_law_1.2,6.409849548339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,1,power_law_1.01,10.809126281738282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,1,balanced,0.8323093255360922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,1,power_law_1.01,7.690054321289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,1,power_law_1.01,0.9013759613037109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,1,balanced,7.433408101399739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,1,power_law_1.2,60.22822875976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,1,power_law_1.2,8.708882904052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,1,balanced,0.8919359842936198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,1,balanced,6.218016306559245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.01,1.121343994140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,1,power_law_1.01,16.850758361816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,1,power_law_1.01,11.599603271484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,1,balanced,1.3180639743804932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.01,1.5283647537231446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,1,power_law_1.2,10.887987518310547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,1,balanced,11.274842580159506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,1,power_law_1.01,15.174374389648438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,1,balanced,1.7896426518758137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.01,1.9567552566528321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,1,balanced,8.366320292154947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,1,power_law_1.01,33.98496704101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,1,power_law_1.2,16.97875213623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.01,2.829875183105469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,1,balanced,2.6841866175333657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,1,power_law_1.01,18.783692932128908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.01,3.7208511352539064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,1,balanced,14.751295725504557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,1,balanced,3.560672124226888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.01,5.496031951904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,1,balanced,10.428927739461264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,1,power_law_1.2,34.0419189453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,1,power_law_1.01,29.79552001953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,1,balanced,5.401472091674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.01,7.188441467285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,1,balanced,18.29796854654948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,1,balanced,7.176607767740886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.01,10.878214263916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,1,balanced,16.632816314697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.01,14.598764038085937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,1,power_law_1.01,60.08173828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,1,balanced,10.73907216389974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,1,power_law_1.01,18.278720092773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,1,balanced,29.1754887898763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,1,balanced,14.401728312174479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,1,power_law_1.01,30.59566650390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,1,balanced,18.02192560831706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,1,balanced,33.83084360758463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,1,power_law_1.01,65.15950927734374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,1,balanced,59.035074869791664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,1,balanced,29.42656962076823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,1,balanced,64.64781188964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,1,balanced,0.347978671391805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,1,power_law_1.2,0.11471359729766846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,1,balanced,0.19260799884796143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,1,power_law_1.2,0.1493183970451355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,1,balanced,0.5802559852600098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,1,power_law_1.2,0.1978368043899536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,1,balanced,1.1250879764556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,1,balanced,0.3109760085741679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,1,power_law_1.2,0.3459455966949463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,1,balanced,1.1282613277435303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,1,balanced,0.5846186478932699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,1,power_law_1.2,0.35530240535736085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,1,balanced,0.5892213185628256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,1,balanced,1.124346653620402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,1,power_law_1.2,0.3942847967147827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,1,balanced,0.5898986657460531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,1,balanced,1.129850705464681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,1,power_law_1.2,0.4321983814239502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,1,balanced,0.5978933175404867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,1,balanced,1.1362826824188232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,1,power_law_1.2,0.46764798164367677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,1,balanced,0.6001706520716349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,1,balanced,1.1417333285013835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,1,balanced,0.6067253351211548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,1,balanced,1.1781439781188965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,1,balanced,0.6095519860585531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,1,balanced,1.1850559711456299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,1,power_law_1.2,0.4482431888580322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,1,balanced,0.6140906810760498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,1,balanced,1.1814186573028564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,1,balanced,0.6287253300348917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,1,power_law_1.2,0.46085758209228517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,1,balanced,1.1938506762186687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,1,balanced,0.6341280142466227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,1,balanced,1.2004480361938477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,1,balanced,0.6418666839599609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,1,balanced,0.18769067525863647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,1,power_law_1.2,0.43612160682678225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,1,balanced,1.3017226854960124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,1,balanced,0.6927146911621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,1,balanced,0.3148053288459778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,1,balanced,1.2711946964263916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,1,power_law_1.2,0.46167678833007814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,1,balanced,0.6873813470204672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,1,balanced,0.5889653364817301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,1,balanced,1.2899093627929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,1,power_law_1.2,0.47600641250610354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,1,balanced,0.6840213139851888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,1,balanced,0.5932586590449015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,1,power_law_1.2,0.5534912109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,1,balanced,0.7310506502787272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,1,balanced,1.343450705210368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,1,balanced,0.5969173510869344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,1,power_law_1.2,0.5596288204193115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,1,balanced,0.9160640239715576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,1,balanced,1.6324747403462727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,1,power_law_1.01,0.2964544057846069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,1,power_law_1.01,0.1923583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,1,balanced,0.6020053227742513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,1,power_law_1.2,0.5738624095916748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,1,balanced,0.9399680296579996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,1,balanced,1.6410773595174153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,1,balanced,0.6082079807917277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,1,power_law_1.01,0.4576767921447754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,1,power_law_1.01,0.24010241031646729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,1,power_law_1.2,0.7145599842071533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,1,balanced,1.3311253388722737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,1,balanced,2.3442506790161133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,1,balanced,0.6132853428522745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,1,power_law_1.01,0.6484608173370361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,1,power_law_1.01,0.3301440000534058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,1,power_law_1.01,0.17704960107803344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,1,power_law_1.2,0.881772804260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,1,balanced,1.6711947123209636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,1,power_law_1.01,0.5873151779174804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,1,balanced,2.961477279663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,1,power_law_1.01,1.1262847900390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,1,power_law_1.01,0.22305281162261964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.2,1.1054143905639648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,1,power_law_1.01,0.5741888046264648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,1,balanced,2.4273173014322915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,1,power_law_1.01,1.1244095802307128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,1,power_law_1.01,0.2774784088134766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,1,balanced,4.492042541503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.2,1.5472831726074219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,1,power_law_1.01,0.5905983924865723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,1,power_law_1.01,1.1162240028381347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,1,power_law_1.01,0.5663487911224365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,1,balanced,0.6207413276036581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.2,1.9647552490234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,1,balanced,3.272864023844401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,1,balanced,6.018218358357747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,1,power_law_1.01,0.6401599884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,1,power_law_1.01,0.5822527885437012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,1,power_law_1.01,1.1793791770935058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,1,balanced,0.6273333231608073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.2,2.8372159957885743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,1,power_law_1.01,0.6389311790466309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,1,power_law_1.01,0.6310080051422119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,1,power_law_1.01,1.2045439720153808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,1,balanced,4.960890769958496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,1,balanced,9.463701248168945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.2,3.7038272857666015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,1,power_law_1.01,0.7347263813018798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,1,power_law_1.01,1.2004608154296874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,1,power_law_1.01,0.654585599899292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,1,power_law_1.2,0.308351993560791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.2,5.447430419921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,1,balanced,6.855578740437825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,1,power_law_1.01,0.7565567970275879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,1,power_law_1.01,1.2625856399536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,1,power_law_1.01,0.6722367763519287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,1,balanced,12.861072540283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,1,power_law_1.2,0.4008063793182373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,1,power_law_1.01,1.2991423606872559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.2,7.191661071777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,1,power_law_1.2,0.5042111873626709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,1,power_law_1.01,0.698137617111206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,1,power_law_1.2,1.0406911849975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,1,power_law_1.01,1.3907072067260742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,1,balanced,10.321749369303385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,1,power_law_1.01,0.7409088134765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,1,power_law_1.01,0.7120063781738282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.2,10.808518218994141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,1,power_law_1.2,1.1279359817504884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,1,balanced,0.642357349395752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,1,power_law_1.01,1.4627008438110352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,1,balanced,19.02886454264323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,1,power_law_1.2,1.1295424461364747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,1,power_law_1.01,0.780185604095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,1,power_law_1.01,0.77706880569458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,1,balanced,0.6569120089213053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,1,power_law_1.2,1.2161151885986328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,1,power_law_1.01,1.4482432365417481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.2,14.443475341796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,1,power_law_1.2,1.1917887687683106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,1,power_law_1.01,0.7751167774200439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,1,balanced,0.6657600005467733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,1,balanced,14.047354380289713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,1,power_law_1.01,1.5499199867248534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,1,power_law_1.2,1.2008895874023438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,1,power_law_1.01,0.8686911582946777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,1,balanced,0.6870986620585123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,1,power_law_1.01,0.690060806274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,1,power_law_1.2,1.349567985534668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,1,power_law_1.2,18.437228393554687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,1,power_law_1.01,1.647782325744629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,1,balanced,25.050069173177082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,1,power_law_1.2,1.3272704124450683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,1,balanced,0.7467466990152994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,1,power_law_1.01,0.8688639640808106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,1,power_law_1.01,0.7524991989135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,1,power_law_1.01,1.717318344116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,1,power_law_1.2,1.4109248161315917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,1,balanced,0.7709333101908366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,1,power_law_1.01,0.9291135787963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,1,power_law_1.01,0.7967743873596191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,1,power_law_1.2,1.5613696098327636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,1,balanced,17.731802622477215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,1,power_law_1.01,2.0307775497436524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,1,balanced,0.8154346942901611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,1,power_law_1.2,30.280126953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,1,power_law_1.2,1.4885760307312013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,1,power_law_1.01,1.0787839889526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,1,power_law_1.01,0.9025856018066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,1,balanced,1.3122133413950603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,1,power_law_1.2,1.575660800933838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,1,power_law_1.01,2.358201599121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,1,power_law_1.01,0.867955207824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,1,power_law_1.01,1.2731136322021483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,1,power_law_1.2,1.5834624290466308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,1,balanced,31.60523223876953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,1,balanced,1.3996480305989583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,1,power_law_1.01,3.2097152709960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,1,power_law_1.2,1.83624324798584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,1,power_law_1.01,0.9423999786376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,1,power_law_1.01,1.679539108276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,1,power_law_1.2,2.1215295791625977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,1,balanced,2.1196212768554688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,1,power_law_1.01,3.645452880859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,1,power_law_1.01,1.122265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,1,power_law_1.01,2.042406463623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,1,power_law_1.2,2.355289649963379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,1,balanced,2.793930689493815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,1,power_law_1.01,1.421292781829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,1,power_law_1.2,64.184765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,1,power_law_1.2,3.1389951705932617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,1,balanced,27.479995727539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,1,power_law_1.01,5.321363067626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,1,power_law_1.01,2.768083190917969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,1,power_law_1.2,3.642483139038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.01,1.7916351318359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,1,balanced,4.26195748647054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,1,power_law_1.01,3.638111877441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,1,power_law_1.01,6.927961730957032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,1,power_law_1.2,5.260153579711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.01,2.4949504852294924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,1,power_law_1.01,5.339788818359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,1,balanced,5.776959737141927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,1,power_law_1.2,6.966860961914063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,1,balanced,49.324066162109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,1,power_law_1.01,9.891820526123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.01,3.1469823837280275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,1,power_law_1.2,10.068697357177735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,1,power_law_1.01,7.086975860595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,1,balanced,8.733162562052408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.01,4.530169677734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,1,power_law_1.01,13.333261108398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,1,power_law_1.2,12.824557495117187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,1,power_law_1.01,10.745670318603516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.01,5.929849624633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,1,balanced,12.009194691975912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,1,power_law_1.2,19.747378540039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,1,power_law_1.01,19.631193542480467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,1,power_law_1.01,14.1780029296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.01,9.092665863037109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,1,power_law_1.2,26.5761474609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,1,balanced,55.1008555094401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,1,power_law_1.01,26.415499877929687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,1,balanced,18.21661885579427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,1,power_law_1.01,18.074783325195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.01,12.079590606689454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,1,power_law_1.2,33.044793701171876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,1,power_law_1.01,32.831295776367185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.01,18.841477966308595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,1,power_law_1.01,27.710629272460938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,1,balanced,24.933990478515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,1,balanced,98.55668131510417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,1,power_law_1.2,49.87726745605469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.01,25.49605712890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,1,power_law_1.01,50.627359008789064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,1,power_law_1.01,55.0374755859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,1,balanced,31.970484415690105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,1,power_law_1.01,32.55896911621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,1,power_law_1.2,99.32092895507813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,1,power_law_1.01,55.46712036132813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,1,power_law_1.01,99.73851318359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,1,balanced,55.1559804280599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,1,power_law_1.01,115.61666259765624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,1,balanced,119.8536885579427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,1,power_law_1.2,0.1763327956199646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,1,power_law_1.2,0.2663167953491211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,1,power_law_1.2,0.2824831962585449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,1,power_law_1.2,0.5592895984649658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,1,power_law_1.2,0.589631986618042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,1,power_law_1.2,0.6244736194610596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,1,power_law_1.2,0.6504191875457763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,1,power_law_1.2,0.6334464073181152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,1,power_law_1.2,0.680134391784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,1,power_law_1.2,0.6915264129638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,1,power_law_1.2,0.6756288051605225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,1,power_law_1.2,0.7183487892150879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,1,power_law_1.2,0.7077055931091308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,1,power_law_1.2,0.790227222442627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,1,power_law_1.2,0.17813760042190552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,1,power_law_1.2,0.832908821105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,1,power_law_1.2,0.8439680099487304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,1,power_law_1.2,0.26845440864562986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,1,power_law_1.2,0.9234623908996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,1,power_law_1.2,0.31655681133270264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,1,power_law_1.2,0.56430082321167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,1,power_law_1.2,1.145849609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,1,power_law_1.2,0.569708776473999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,1,power_law_1.2,1.2741312026977538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,1,power_law_1.2,0.6742464065551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,1,power_law_1.2,1.6686399459838868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,1,power_law_1.2,0.7248703956604003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,1,power_law_1.2,2.0256576538085938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,1,power_law_1.2,0.803923225402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,1,power_law_1.2,2.8273088455200197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,1,power_law_1.2,3.648223876953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,1,power_law_1.2,0.7350016117095948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,1,power_law_1.2,5.243059158325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,1,power_law_1.2,0.7800767898559571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,1,power_law_1.2,7.109561920166016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,1,power_law_1.2,10.567494201660157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,1,power_law_1.2,0.7024256229400635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,1,balanced,0.22152000665664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,1,power_law_1.2,0.7714240074157714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,1,power_law_1.2,14.453581237792969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,1,power_law_1.2,0.7934976100921631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,1,balanced,0.3622399965922038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,1,power_law_1.2,0.9231167793273926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,1,balanced,0.6803092956542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,1,power_law_1.2,18.276824951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,1,power_law_1.2,0.8689727783203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,1,balanced,1.3332053025563557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,1,power_law_1.2,0.9532032012939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,1,balanced,2.6241013209025064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,1,power_law_1.2,1.0897343635559082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,1,balanced,5.158416112263997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,1,power_law_1.2,27.871182250976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,1,power_law_1.2,1.4074687957763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,1,balanced,0.13486933708190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,1,balanced,5.175600051879883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.2,1.7112512588500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,1,balanced,0.2060693303743998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,1,balanced,5.227072079976399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.2,2.4490175247192383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,1,balanced,0.3657333453496297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,1,balanced,0.6978773276011149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.2,3.137068748474121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,1,balanced,5.213184038798015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,1,balanced,1.3514827092488606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,1,power_law_1.2,54.82216186523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.2,4.524192047119141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,1,balanced,2.629765351613363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,1,balanced,5.198527971903483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,1,balanced,2.6305440266927085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,1,power_law_1.01,0.2230463981628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.2,5.955276870727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,1,balanced,5.231290817260742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,1,balanced,2.627247969309489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,1,balanced,2.6601813634236655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,1,power_law_1.01,0.362009596824646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,1,balanced,5.249034563700358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.2,9.042444610595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,1,balanced,2.6517653465270996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,1,power_law_1.01,0.43251838684082033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,1,balanced,2.664992014567057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,1,balanced,5.267258644104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,1,balanced,0.18303465843200684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.2,12.087961578369141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,1,balanced,2.692234675089518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,1,power_law_1.01,0.9671615600585938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,1,balanced,5.312944094340007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,1,balanced,0.24450133244196573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,1,balanced,2.707514762878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,1,power_law_1.01,1.6740480422973634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,1,balanced,0.4251999855041504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,1,balanced,2.726074536641439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,1,balanced,5.326794624328613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.2,18.611270141601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,1,power_law_1.01,2.3813568115234376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,1,balanced,2.7660481135050454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,1,balanced,0.7327626546223959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,1,balanced,5.366682688395183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,1,balanced,2.7852160135904946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,1,power_law_1.01,0.1352895975112915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,1,power_law_1.01,3.3934398651123048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,1,balanced,1.3909173011779785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,1,balanced,2.8745972315470376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.2,25.943142700195313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,1,balanced,5.402608235677083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,1,power_law_1.01,0.20614399909973144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,1,power_law_1.01,3.8228481292724608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,1,balanced,2.699376106262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,1,balanced,2.9636052449544272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,1,power_law_1.01,0.23420801162719726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,1,balanced,2.710346539815267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,1,power_law_1.01,3.847001647949219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,1,balanced,5.660570780436198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,1,balanced,2.991941452026367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,1,power_law_1.2,33.28581848144531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,1,balanced,2.7234878540039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,1,power_law_1.01,0.5207039833068847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,1,power_law_1.01,4.034207916259765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,1,balanced,5.740261077880859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,1,balanced,3.0899359385172525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,1,balanced,2.724933306376139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,1,power_law_1.01,0.8739007949829102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,1,power_law_1.01,4.126937484741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,1,balanced,2.7434345881144204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,1,power_law_1.01,1.235910415649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,1,balanced,5.901914596557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,1,balanced,3.2783358891805015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,1,power_law_1.01,4.191743850708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,1,balanced,2.7602933247884116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,1,power_law_1.01,1.6750207901000977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,1,power_law_1.2,54.484246826171876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,1,power_law_1.01,4.275929641723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,1,balanced,6.1499678293863935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,1,balanced,3.557861328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,1,balanced,2.7774985631306968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,1,power_law_1.01,1.9275327682495118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,1,power_law_1.01,4.662598419189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,1,balanced,2.803018569946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,1,power_law_1.01,0.19544960260391236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,1,power_law_1.01,1.9976831436157227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,1,power_law_1.01,4.72405776977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,1,balanced,6.479925155639648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,1,balanced,3.784677187601725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,1,balanced,2.841829299926758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,1,power_law_1.01,0.26965761184692383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,1,power_law_1.01,2.0187200546264648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,1,power_law_1.01,4.9644416809082035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,1,power_law_1.01,0.2866624116897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,1,balanced,2.8998613357543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,1,power_law_1.01,2.1396608352661133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,1,power_law_1.01,4.975827026367187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,1,power_law_1.01,0.5529151916503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,1,balanced,6.72764269510905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,1,balanced,2.952453295389811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,1,power_law_1.01,2.182547187805176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,1,balanced,5.016378720601399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,1,power_law_1.01,5.524288177490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,1,power_law_1.01,0.8659008026123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,1,power_law_1.01,2.2689535140991213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,1,balanced,3.0346028010050454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,1,power_law_1.2,115.27977294921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,1,power_law_1.01,1.2338111877441407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,1,power_law_1.01,5.783731079101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,1,power_law_1.01,2.3410879135131837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,1,balanced,8.362576166788736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,1,power_law_1.01,1.8342208862304688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,1,power_law_1.01,6.915846252441407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,1,power_law_1.01,2.3644287109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,1,balanced,5.4144643147786455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,1,power_law_1.01,1.9048063278198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,1,power_law_1.01,2.4246143341064452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,1,power_law_1.01,6.149983978271484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,1,power_law_1.01,2.0166784286499024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,1,balanced,3.222890535990397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,1,power_law_1.01,2.8143552780151366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,1,power_law_1.01,7.193011474609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,1,power_law_1.01,2.108255958557129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,1,balanced,8.986917495727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,1,power_law_1.01,3.333318328857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,1,power_law_1.01,2.1664384841918944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,1,power_law_1.01,8.099494171142577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,1,balanced,7.540085474650065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,1,power_law_1.01,3.1757312774658204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,1,power_law_1.01,2.37825927734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,1,power_law_1.01,10.095206451416015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,1,power_law_1.01,3.7646656036376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,1,power_law_1.01,2.489695930480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,1,power_law_1.01,11.854662322998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,1,power_law_1.01,3.379238510131836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,1,power_law_1.01,2.7387840270996096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,1,balanced,3.413087844848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,1,balanced,12.5088742574056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,1,power_law_1.01,3.866969680786133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,1,power_law_1.01,15.930776977539063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,1,power_law_1.01,2.9944896697998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,1,balanced,3.7491305669148765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,1,power_law_1.01,4.509856033325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,1,power_law_1.01,3.218860626220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,1,power_law_1.01,20.624114990234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,1,balanced,10.172463734944662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,1,power_law_1.01,5.576038360595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,1,balanced,4.080186525980632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,1,power_law_1.01,3.6976703643798827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,1,power_law_1.01,6.938432312011718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,1,power_law_1.01,24.413005065917968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,1,balanced,4.954554557800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,1,power_law_1.01,9.26503677368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,1,power_law_1.01,3.8772544860839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,1,balanced,16.921588897705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,1,power_law_1.01,11.772447967529297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,1,balanced,5.4737122853597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,1,power_law_1.01,36.132363891601564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.01,3.5159358978271484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,1,power_law_1.01,14.616908264160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.01,4.350009536743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,1,balanced,12.346319834391275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,1,balanced,9.196650822957357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.01,5.093356704711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,1,power_law_1.01,21.440243530273438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.01,5.73370246887207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,1,power_law_1.01,67.77561645507812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.01,6.996243286132812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,1,balanced,19.858768463134766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,1,balanced,10.558005650838217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,1,power_law_1.01,39.82616271972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.01,9.584518432617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.01,12.114265441894531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.01,17.669024658203124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,1,balanced,15.94760004679362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.01,23.047628784179686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,1,balanced,19.234181722005207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,1,power_law_1.01,28.746829223632812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,1,balanced,31.921946207682293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,1,power_law_1.01,44.89429626464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,1,balanced,21.947525024414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,1,power_law_1.01,91.33914184570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,1,balanced,27.508010864257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,1,power_law_1.2,0.22339839935302735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,1,power_law_1.2,0.3547071933746338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,1,power_law_1.2,0.4379712104797363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,1,power_law_1.2,0.8966015815734864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,1,balanced,39.063209533691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,1,power_law_1.2,1.4249728202819825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,1,power_law_1.2,2.0531455993652346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,1,power_law_1.2,3.427257537841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,1,power_law_1.2,3.6329086303710936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,1,power_law_1.2,3.9019134521484373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,1,balanced,46.21544901529948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,1,power_law_1.2,3.9801025390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,1,balanced,64.18533325195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,1,power_law_1.2,4.181619262695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,1,power_law_1.2,4.195955276489258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,1,power_law_1.2,4.390694427490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,1,power_law_1.2,4.7707263946533205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,1,power_law_1.2,4.935404968261719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,1,power_law_1.2,5.312742233276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,1,power_law_1.2,0.12443519830703735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,1,power_law_1.2,5.179244613647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,1,power_law_1.2,0.20369279384613037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,1,power_law_1.2,0.2381056070327759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,1,power_law_1.2,5.928384017944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,1,power_law_1.2,0.49448318481445314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,1,power_law_1.2,6.310758590698242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,1,power_law_1.2,0.7560704231262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,1,power_law_1.2,1.0601920127868651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,1,power_law_1.2,7.3207038879394535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,1,power_law_1.2,1.6784255981445313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,1,power_law_1.2,6.681088256835937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,1,power_law_1.2,1.855571174621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,1,power_law_1.2,1.9463935852050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,1,power_law_1.2,7.521932983398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,1,power_law_1.2,1.989356803894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,1,power_law_1.2,8.624838256835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,1,power_law_1.2,2.122195243835449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,1,power_law_1.2,2.163814353942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,1,power_law_1.2,10.556403350830077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,1,power_law_1.2,2.249363136291504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,1,power_law_1.2,2.2920000076293947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,1,power_law_1.2,12.515071868896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,1,power_law_1.2,2.4278591156005858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,1,power_law_1.2,2.600057601928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,1,power_law_1.2,17.067135620117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,1,power_law_1.2,3.1185024261474608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,1,balanced,91.76400756835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,1,power_law_1.2,3.521452713012695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,1,power_law_1.2,20.750119018554688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,1,power_law_1.2,3.263014221191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,1,power_law_1.2,0.18808319568634033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,1,power_law_1.2,3.9529792785644533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,1,power_law_1.2,24.813612365722655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,1,power_law_1.2,0.26892800331115724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,1,power_law_1.2,3.5628734588623048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,1,power_law_1.2,0.28078720569610593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,1,power_law_1.2,4.168371200561523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,1,power_law_1.2,35.760595703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,1,power_law_1.2,0.5006464004516602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,1,balanced,0.045461331804593406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,1,power_law_1.2,4.737171173095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,1,power_law_1.2,0.7659200191497803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,1,balanced,0.060693333546320595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,1,power_law_1.2,5.882841491699219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,1,power_law_1.2,1.127347183227539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,1,balanced,0.09655466675758362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,1,power_law_1.2,7.229164886474609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,1,balanced,0.1664426624774933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,1,power_law_1.2,1.7362239837646485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,1,balanced,0.30508800347646076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,1,power_law_1.2,1.9267072677612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,1,power_law_1.2,68.3344970703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,1,power_law_1.2,9.631302642822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,1,balanced,0.3070773283640544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,1,power_law_1.2,1.9316287994384767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,1,balanced,0.31070399284362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,1,power_law_1.2,12.326380920410156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,1,balanced,0.30887999137242633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,1,power_law_1.2,2.068704032897949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,1,balanced,0.31090132395426434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,1,power_law_1.2,2.1555904388427733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,1,power_law_1.2,15.006489562988282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,1,balanced,0.31302400430043537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,1,power_law_1.2,2.3655679702758787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,1,balanced,0.31760533650716144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,1,power_law_1.2,2.5767040252685547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,1,power_law_1.2,21.811827087402342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,1,balanced,0.3198240001996358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,1,power_law_1.2,2.7907583236694338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,1,balanced,0.3216266632080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,1,power_law_1.2,3.04833927154541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,1,balanced,0.3266879916191101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,1,power_law_1.2,3.3330303192138673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,1,balanced,0.34244799613952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,1,power_law_1.2,40.6581298828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,1,balanced,0.34905068079630536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,1,power_law_1.2,3.7293121337890627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,1,balanced,0.36368000507354736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,1,balanced,0.39310399691263836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,1,power_law_1.2,3.9672000885009764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,1,balanced,0.4150186777114868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,1,balanced,0.4543360074361165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.2,3.715488052368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,1,balanced,0.038773333032925926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.2,4.494208145141601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,1,balanced,0.49010133743286133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,1,balanced,0.050069332122802734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.2,5.241702270507813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,1,balanced,0.06846933563550313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,1,balanced,0.6690026919047037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,1,balanced,0.10763200124104817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.2,5.969913482666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,1,balanced,0.17803200085957846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,1,balanced,0.7422560056050619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.2,7.293138885498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,1,balanced,0.18162665764490762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,1,balanced,0.18436266978581747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.2,9.716627502441407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,1,balanced,0.18525334199269614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,1,balanced,0.18680532773335776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,1,balanced,1.0448906421661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.2,12.326406097412109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,1,balanced,0.18800532817840576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,1,balanced,0.19116799036661783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.2,17.48039093017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,1,balanced,0.19311465819676718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,1,balanced,0.197978675365448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,1,balanced,0.06453333298365276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,1,balanced,1.3383253415425618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,1,balanced,0.20459733406702676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.2,22.883763122558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,1,balanced,0.07100266714890797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,1,balanced,0.21380800008773804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,1,balanced,0.08158933122952779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,1,balanced,0.21917865673700967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,1,balanced,0.12097066640853882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,1,power_law_1.2,28.237240600585938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,1,balanced,0.18825600544611612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,1,balanced,0.23938665787378946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,1,balanced,0.19368000825246176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,1,balanced,0.2640213370323181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,1,balanced,1.9457333882649739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,1,balanced,0.19591999053955078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,1,power_law_1.01,0.0433023989200592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,1,balanced,0.1975626746813456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,1,balanced,0.29602666695912677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,1,power_law_1.2,44.80433959960938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,1,balanced,0.20200000206629434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,1,power_law_1.01,0.04772480130195618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,1,balanced,0.20480533440907797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,1,balanced,0.3442933162053426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,1,power_law_1.01,0.07837439775466919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,1,power_law_1.01,0.1199679970741272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,1,balanced,0.20826667547225952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,1,power_law_1.01,0.15440640449523926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,1,balanced,0.39077866077423096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,1,balanced,0.2152106761932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,1,power_law_1.01,0.25284481048583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,1,power_law_1.01,0.26316161155700685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,1,balanced,0.21996800104777017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,1,power_law_1.01,0.27686400413513185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,1,balanced,0.5631253321965536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,1,balanced,0.23068799575169882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,1,balanced,2.5765973726908364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,1,power_law_1.01,0.2876863956451416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,1,power_law_1.01,0.29053440093994143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,1,power_law_1.2,88.39315185546874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,1,power_law_1.01,0.30424959659576417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,1,balanced,0.6546133359273275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,1,power_law_1.01,0.3119424104690552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,1,power_law_1.01,0.3179392099380493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,1,balanced,0.24986666440963745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,1,power_law_1.01,0.33219199180603026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,1,power_law_1.01,0.34885120391845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,1,balanced,0.2577600081761678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,1,power_law_1.01,0.3663872003555298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,1,balanced,0.9534080028533936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,1,power_law_1.01,0.3844480037689209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,1,power_law_1.01,0.44733438491821287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,1,power_law_1.01,0.4492288112640381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,1,balanced,3.215786616007487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,1,power_law_1.01,0.5064511775970459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,1,power_law_1.01,0.570572805404663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,1,balanced,1.2612426280975342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,1,power_law_1.01,0.7170623779296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,1,power_law_1.01,0.860319995880127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,1,balanced,0.29632000128428143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,1,power_law_1.01,1.1632320404052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,1,balanced,0.3455679814020793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,1,power_law_1.01,1.462284755706787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,1,balanced,0.384554664293925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,1,power_law_1.01,2.059347152709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,1,power_law_1.01,2.680588722229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,1,balanced,0.5457173188527426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,1,balanced,1.8403786023457844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,1,power_law_1.01,3.298611068725586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,1,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,1,power_law_1.01,5.034745788574218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,1,balanced,0.6241439978281657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,1,power_law_1.01,0.03954559862613678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,1,power_law_1.01,0.058195197582244874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,1,power_law_1.01,10.332332611083984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,1,power_law_1.01,0.08054400086402894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,1,balanced,0.9512639840443929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,1,power_law_1.01,0.09976959824562073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,1,power_law_1.01,0.15559040307998656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,1,balanced,5.086837450663249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,1,balanced,2.436896006266276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,1,power_law_1.01,0.16001919507980347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,1,balanced,1.1283466815948486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,1,power_law_1.01,0.16442879438400268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,1,power_law_1.01,0.17593599557876588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,1,power_law_1.01,0.17669119834899902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,1,power_law_1.01,0.18724479675292968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,1,power_law_1.01,0.20247039794921876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,1,balanced,1.6436853408813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,1,power_law_1.01,0.20713601112365723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,1,power_law_1.01,0.21340160369873046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,1,power_law_1.01,0.2221951961517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,1,power_law_1.01,0.23340160846710206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,1,balanced,3.0467039744059243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,1,power_law_1.01,0.24315519332885743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,1,balanced,2.1767679850260415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,1,power_law_1.01,0.282207989692688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,1,power_law_1.01,0.3214656114578247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,1,power_law_1.01,0.3910144090652466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,1,power_law_1.01,0.054841601848602296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,1,power_law_1.01,0.4487040042877197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,1,power_law_1.01,0.06698240041732788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,1,power_law_1.01,0.5887936115264892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,1,power_law_1.01,0.07731840014457703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,1,power_law_1.01,0.7269951820373535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,1,balanced,3.202005386352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,1,power_law_1.01,0.09560319781303406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,1,power_law_1.01,1.0092415809631348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,1,power_law_1.01,0.11215360164642334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,1,power_law_1.01,0.17080960273742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,1,power_law_1.01,1.2816767692565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,1,power_law_1.01,0.17403520345687867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,1,power_law_1.01,1.8500095367431642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,1,power_law_1.01,0.1834496021270752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,1,power_law_1.01,2.4505983352661134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,1,power_law_1.01,0.1966655969619751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,1,power_law_1.01,0.19704320430755615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,1,power_law_1.01,3.013907241821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,1,balanced,4.81553586324056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,1,balanced,4.249375979105632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,1,power_law_1.01,0.21166720390319824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,1,power_law_1.01,4.715846252441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,1,power_law_1.01,0.2259455919265747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,1,power_law_1.2,0.043136000633239746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,1,balanced,10.084239959716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,1,power_law_1.01,0.23549439907073974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,1,power_law_1.01,9.6984130859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,1,power_law_1.2,0.04695039987564087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,1,power_law_1.01,0.25939838886260985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,1,power_law_1.2,0.06376960277557372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,1,power_law_1.2,0.10321279764175414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,1,power_law_1.01,0.27241599559783936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,1,power_law_1.2,0.14979840517044068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,1,power_law_1.2,0.2537856101989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,1,power_law_1.01,0.29119999408721925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,1,power_law_1.2,0.2725248098373413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,1,balanced,5.287919998168945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,1,power_law_1.2,0.2823807954788208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,1,power_law_1.01,0.30462079048156737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,1,power_law_1.2,0.29434239864349365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,1,power_law_1.01,0.36187520027160647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,1,power_law_1.2,0.3032383918762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,1,power_law_1.01,0.4353856086730957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,1,power_law_1.2,0.30598399639129636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,1,power_law_1.01,0.5828864097595214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,1,power_law_1.2,0.3165247917175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,1,power_law_1.01,0.7145919799804688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,1,power_law_1.2,0.32274560928344725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,1,power_law_1.2,0.3384320020675659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,1,power_law_1.01,0.9804863929748535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,1,power_law_1.2,0.35545599460601807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,1,power_law_1.01,1.2379839897155762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,1,power_law_1.2,0.368287992477417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,1,power_law_1.01,1.7536191940307617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,1,power_law_1.2,0.3961087942123413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,1,power_law_1.01,2.269331169128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,1,power_law_1.2,0.44999041557312014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,1,power_law_1.01,3.3210880279541017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,1,power_law_1.2,0.44994559288024905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,1,power_law_1.2,0.5140351772308349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,1,power_law_1.01,4.35032958984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,1,balanced,8.428458531697592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,1,power_law_1.2,0.5838848114013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,1,balanced,9.41975466410319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,1,power_law_1.01,5.398591995239258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,1,power_law_1.2,0.7474495887756347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,1,power_law_1.2,0.880288028717041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,1,power_law_1.01,8.523296356201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,1,power_law_1.2,1.1850432395935058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,1,power_law_1.2,1.4776896476745605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,1,power_law_1.01,16.865458679199218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,1,power_law_1.2,0.03741439878940582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,1,power_law_1.2,2.0809024810791015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,1,power_law_1.2,0.04417920112609863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,1,power_law_1.2,2.722751998901367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,1,power_law_1.2,0.05475839972496033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,1,power_law_1.2,3.3353214263916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,1,power_law_1.2,0.07560960054397584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,1,power_law_1.2,0.09000319838523865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,1,power_law_1.2,5.03581428527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,1,power_law_1.2,0.15610239505767823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,1,power_law_1.2,0.15719679594039918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,1,power_law_1.2,10.43025894165039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,1,power_law_1.2,0.16741759777069093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,1,power_law_1.2,0.17541760206222534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,1,power_law_1.2,0.18191360235214232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,1,power_law_1.2,0.1922368049621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,1,power_law_1.2,0.20339200496673585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,1,power_law_1.2,0.2145535945892334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,1,power_law_1.2,0.21222400665283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,1,power_law_1.2,0.224236798286438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,1,power_law_1.2,0.239136004447937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,1,power_law_1.2,0.25109119415283204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,1,power_law_1.2,0.29110400676727294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,1,balanced,16.767349243164062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,1,power_law_1.2,0.3326591968536377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,1,power_law_1.2,0.3985599994659424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,1,power_law_1.2,0.46185598373413084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,1,power_law_1.2,0.5983551979064942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,1,power_law_1.2,0.05686399936676025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,1,power_law_1.2,0.729420804977417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,1,power_law_1.2,1.0046400070190429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,1,power_law_1.2,0.06630399823188782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,1,power_law_1.2,0.07454079985618592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,1,power_law_1.2,1.2861184120178222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,1,power_law_1.2,0.08954240083694458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,1,power_law_1.2,1.8545408248901367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,1,power_law_1.2,0.10455039739608765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,1,power_law_1.2,0.1663424015045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,1,power_law_1.2,2.4459840774536135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,1,power_law_1.2,0.17959680557250976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,1,power_law_1.2,3.009836769104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,1,power_law_1.2,0.18496639728546144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,1,power_law_1.2,0.19567359685897828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,1,power_law_1.2,4.695513534545898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,1,power_law_1.2,0.2044543981552124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,1,power_law_1.2,0.21328001022338866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,1,power_law_1.2,9.743929290771485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,1,power_law_1.2,0.2275968074798584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,1,power_law_1.2,0.23551359176635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,1,power_law_1.2,0.2598400115966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,1,power_law_1.2,0.2753472089767456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,1,power_law_1.2,0.296345591545105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,1,power_law_1.2,0.3060992002487183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,1,power_law_1.2,0.3685120105743408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,1,power_law_1.2,0.44069762229919435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,1,power_law_1.2,0.5914495944976806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,1,power_law_1.2,0.7276735782623291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,1,power_law_1.2,0.9852288246154786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,1,balanced,0.09645332892735799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,1,power_law_1.2,1.250169563293457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,1,balanced,0.16620799899101257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,1,balanced,0.06982400019963582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,1,balanced,0.3019040028254191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,1,power_law_1.2,1.7580991744995118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,1,balanced,0.5837706724802653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,1,balanced,0.10245333115259807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,1,power_law_1.2,2.2848384857177733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,1,balanced,1.127301295598348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,1,balanced,0.17140799760818481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,1,power_law_1.2,3.33001594543457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,1,balanced,1.1390399932861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,1,balanced,0.3121760090192159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,1,balanced,1.137445370356242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,1,balanced,0.5986080169677734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,1,power_law_1.2,4.367596817016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,1,balanced,1.1395413080851238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,1,balanced,0.5997013250986735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,1,balanced,1.1451306343078613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,1,power_law_1.2,5.410412979125977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,1,balanced,0.611573338508606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,1,balanced,1.1539839903513591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,1,balanced,0.6058346827824911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,1,power_law_1.2,8.556633758544923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,1,balanced,1.1551733016967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,1,balanced,0.6135626633961996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,1,balanced,0.6201920111974081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,1,balanced,1.1644426981608074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,1,power_law_1.2,16.90453186035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,1,balanced,0.6315786838531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,1,balanced,1.1669066747029622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,1,balanced,0.6384373505910238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,1,balanced,1.17686931292216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,1,balanced,0.6423840125401815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,1,balanced,1.2235199610392253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,1,balanced,0.6538559993108114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,1,balanced,1.2358453273773193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,1,balanced,0.6685226758321127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,1,balanced,1.2766773700714111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,1,balanced,0.6783626874287924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,1,balanced,0.6991999944051107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,1,balanced,1.3090986410776775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,1,balanced,0.7427626450856527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,1,balanced,1.3833492596944172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,1,balanced,0.7913653055826823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,1,power_law_1.01,0.09552000164985656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,1,balanced,1.4484000205993652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,1,power_law_1.01,0.11806080341339112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,1,balanced,0.8660586675008138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,1,power_law_1.01,0.2376960039138794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,1,balanced,1.525935967763265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,1,balanced,0.9414986769358317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,1,power_law_1.01,0.3704319953918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,1,power_law_1.01,0.5124415874481201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,1,power_law_1.01,0.9648832321166992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,1,balanced,1.9664427439371746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,1,balanced,1.2761653264363606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,1,power_law_1.01,0.06606079936027527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,1,power_law_1.01,0.9683199882507324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,1,power_law_1.01,1.0189632415771483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,1,power_law_1.01,0.08058239817619324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,1,balanced,0.08777067065238953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,1,power_law_1.01,1.0321663856506347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,1,balanced,2.1125547091166177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,1,balanced,1.4295786221822102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,1,power_law_1.01,0.137990403175354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,1,power_law_1.01,1.0643775939941407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,1,balanced,0.12165866295496623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,1,power_law_1.01,0.21266560554504393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,1,power_law_1.01,1.1321151733398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,1,balanced,0.18353599309921265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,1,power_law_1.01,1.1432255744934081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,1,power_law_1.01,0.2931135892868042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,1,balanced,0.3270453413327535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,1,power_law_1.01,1.1903167724609376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,1,power_law_1.01,0.48266239166259767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,1,balanced,2.8996852238972983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,1,balanced,0.6072479883829752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,1,balanced,2.0080107053120932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,1,power_law_1.01,1.202073574066162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,1,power_law_1.01,0.5275904178619385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,1,balanced,0.6136159896850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,1,power_law_1.01,1.2318079948425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,1,balanced,0.6178346474965414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,1,power_law_1.01,0.533465576171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,1,power_law_1.01,1.253587245941162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,1,balanced,0.6214826504389445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,1,power_law_1.01,1.311628818511963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,1,power_law_1.01,0.5470719814300538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,1,balanced,0.6284053325653076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,1,power_law_1.01,0.5447487831115723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,1,balanced,3.85099188486735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,1,power_law_1.01,1.4790911674499512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,1,balanced,2.637610594431559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,1,power_law_1.01,1.4452927589416504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,1,power_law_1.01,0.5885056018829345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,1,balanced,0.6346986691157023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,1,power_law_1.01,1.6346431732177735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,1,power_law_1.01,0.602297592163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,1,balanced,0.6435306469599406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,1,power_law_1.01,1.823846435546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,1,power_law_1.01,0.6110015869140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,1,balanced,0.6574186484018961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,1,power_law_1.01,2.23242244720459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,1,power_law_1.01,0.6585408210754394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,1,balanced,0.6688693364461263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,1,power_law_1.01,2.7027711868286133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,1,power_law_1.01,0.6820672035217286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,1,balanced,0.6912960211435953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,1,power_law_1.01,3.568511962890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,1,balanced,5.701712290445964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,1,balanced,3.8873440424601235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,1,power_law_1.01,0.7007359981536865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,1,power_law_1.01,4.721484756469726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,1,power_law_1.01,0.0916159987449646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,1,power_law_1.01,0.7080959796905517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,1,power_law_1.01,6.4443199157714846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,1,power_law_1.01,0.09679359793663025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,1,power_law_1.01,0.8051520347595215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,1,power_law_1.01,8.232838439941407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,1,power_law_1.01,0.15639679431915282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,1,balanced,0.7154293060302734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,1,power_law_1.01,0.8424575805664063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,1,power_law_1.01,10.032524871826173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,1,power_law_1.01,0.2230207920074463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,1,power_law_1.01,0.9996992111206054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,1,balanced,0.7339306672414144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,1,power_law_1.01,0.2925503969192505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,1,power_law_1.01,1.113644790649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,1,power_law_1.01,15.102854919433593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,1,power_law_1.01,0.5094336032867431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,1,power_law_1.01,1.4163519859313964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,1,balanced,5.157269477844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,1,balanced,7.469045639038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,1,power_law_1.01,0.5520768165588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,1,power_law_1.01,1.708345603942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,1,power_law_1.01,0.5643328189849853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,1,power_law_1.01,29.379653930664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,1,power_law_1.01,2.312281608581543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,1,power_law_1.01,0.5805056095123291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,1,power_law_1.01,2.8661376953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,1,power_law_1.01,0.601913595199585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,1,power_law_1.01,0.6571775913238526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,1,power_law_1.01,4.045548629760742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,1,power_law_1.01,0.7038847923278808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,1,balanced,0.8108800252278646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,1,power_law_1.01,5.296825790405274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,1,power_law_1.01,0.7337920188903808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,1,balanced,0.9298346837361654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,1,power_law_1.01,0.8064064025878906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,1,power_law_1.01,6.513241577148437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,1,balanced,1.0036533673604329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,1,balanced,6.437952041625977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,1,balanced,9.327407836914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,1,power_law_1.01,9.977439880371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,1,power_law_1.01,0.7786687850952149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,1,balanced,1.3013599713643391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,1,power_law_1.01,0.8287232398986817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,1,balanced,1.438218593597412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,1,power_law_1.01,20.729747009277343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,1,power_law_1.2,0.09592959880828858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,1,power_law_1.2,0.10713599920272827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,1,power_law_1.01,0.8680255889892579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,1,balanced,2.220970630645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,1,power_law_1.2,0.2129215955734253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,1,power_law_1.01,1.0479552268981933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,1,power_law_1.2,0.34364159107208253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,1,power_law_1.2,0.4776447772979736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.01,1.215219211578369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,1,power_law_1.2,0.9377408027648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,1,balanced,2.556176026662191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,1,power_law_1.2,0.9996543884277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.01,1.4275327682495118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,1,power_law_1.2,1.0407360076904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.01,1.7405439376831056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,1,power_law_1.2,1.0913472175598145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,1,power_law_1.2,1.0866111755371093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.01,2.338764762878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,1,balanced,3.7809120814005532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,1,power_law_1.2,1.1374784469604493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,1,power_law_1.2,1.1800576210021974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.01,2.949830436706543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,1,balanced,10.193024317423502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,1,balanced,15.135098775227865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,1,power_law_1.2,1.2315135955810548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.01,4.160512161254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,1,power_law_1.2,1.2211711883544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,1,power_law_1.2,1.2562175750732423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.01,5.382009506225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,1,power_law_1.2,1.3109375953674316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,1,balanced,5.0087893803914385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,1,power_law_1.2,1.3913920402526856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.01,7.846835327148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,1,power_law_1.2,1.5270144462585449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,1,power_law_1.2,1.497753620147705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.01,10.31884765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,1,power_law_1.2,1.6620607376098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,1,power_law_1.2,1.882784080505371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,1,power_law_1.01,12.803167724609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,1,power_law_1.2,2.3364416122436524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,1,balanced,7.490245183308919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,1,power_law_1.2,2.7594112396240233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,1,power_law_1.01,20.413043212890624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,1,power_law_1.2,3.647488021850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,1,power_law_1.2,4.7244415283203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,1,power_law_1.2,0.06666240096092224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,1,power_law_1.2,6.448249816894531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,1,power_law_1.01,41.25186462402344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,1,power_law_1.2,0.0769536018371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,1,power_law_1.2,8.33399658203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,1,power_law_1.2,0.12399359941482543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,1,power_law_1.2,10.281075286865235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,1,power_law_1.2,0.17950079441070557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,1,balanced,10.080026626586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,1,power_law_1.2,0.2560895919799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,1,power_law_1.2,15.175027465820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,1,power_law_1.2,0.4770048141479492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,1,power_law_1.2,0.5272575855255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,1,power_law_1.2,0.5665088176727295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,1,power_law_1.2,29.601766967773436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,1,power_law_1.2,0.5637311935424805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,1,power_law_1.2,0.5703936100006104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,1,power_law_1.2,0.6021247863769531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,1,power_law_1.2,0.6125184059143066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,1,balanced,12.534469604492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,1,power_law_1.2,0.6360000133514404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,1,balanced,19.90292231241862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,1,balanced,28.86920420328776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,1,power_law_1.2,0.6671487808227539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,1,power_law_1.2,0.7047167778015136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,1,power_law_1.2,0.7180992126464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,1,power_law_1.2,0.7314879894256592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,1,power_law_1.2,0.8415360450744629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,1,power_law_1.2,0.8800383567810058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,1,power_law_1.2,1.032089614868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,1,power_law_1.2,1.139084815979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,1,power_law_1.2,1.4493247985839843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,1,power_law_1.2,1.7491392135620116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,1,power_law_1.2,2.335270309448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,1,balanced,20.550511678059895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,1,power_law_1.2,2.905196762084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,1,power_law_1.2,4.107155227661133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,1,power_law_1.2,5.4029182434082035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,1,power_law_1.2,6.662477111816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,1,power_law_1.2,10.094124603271485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,1,power_law_1.2,20.9612548828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,1,power_law_1.2,0.09167360067367554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,1,power_law_1.2,0.09872639775276185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,1,power_law_1.2,0.14292479753494264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,1,power_law_1.2,0.2247999906539917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,1,power_law_1.2,0.2640255928039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,1,power_law_1.2,0.5052927970886231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,1,balanced,0.24158932765324911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,1,power_law_1.2,0.5461120128631591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,1,balanced,0.3887840112050374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,1,power_law_1.2,0.5783167839050293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,1,balanced,0.7235626379648844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,1,power_law_1.2,0.6085887908935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,1,balanced,1.4148319562276204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,1,balanced,41.306864420572914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,1,power_law_1.2,0.6259712219238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,1,balanced,2.7980372111002603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,1,power_law_1.2,0.6671487808227539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,1,balanced,3.4850613276163735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,1,power_law_1.2,0.702342414855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,1,balanced,3.5044425328572593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,1,power_law_1.2,0.7453951835632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,1,balanced,3.5066506067911782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,1,power_law_1.2,0.8175616264343262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,1,balanced,3.5299787521362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,1,balanced,3.5253067016601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,1,power_law_1.2,0.7894783973693847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,1,balanced,3.530751864115397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,1,power_law_1.2,0.8517631530761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,1,balanced,3.5350348154703775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,1,balanced,3.5491838455200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,1,power_law_1.2,0.884000015258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,1,balanced,3.5825653076171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,1,power_law_1.2,1.054150390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,1,balanced,3.5950133005777993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.2,1.2345919609069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.2,1.4744256019592286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,1,balanced,3.7263574600219727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.2,1.7687616348266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,1,balanced,3.7786080042521157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.2,2.368351936340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,1,balanced,3.8702398935953775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.2,2.959552001953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.2,4.208601760864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,1,balanced,3.9022293090820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.2,5.415609741210938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,1,balanced,0.1402613321940104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,1,balanced,5.365669250488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.2,7.867584228515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,1,balanced,0.21613866090774536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,1,balanced,0.3866719802220662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.2,10.325510406494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,1,balanced,4.295365333557129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,1,balanced,0.740997314453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,1,balanced,1.4295412699381511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,1,balanced,1.7754507064819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,1,power_law_1.2,12.82529296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,1,balanced,1.781765302022298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,1,balanced,8.667792002360025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,1,balanced,1.7953599294026692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,1,balanced,1.82040007909139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,1,power_law_1.2,20.339244079589843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,1,balanced,1.8205386797587078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,1,balanced,5.514058430989583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,1,balanced,1.8296747207641602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,1,balanced,1.8480532964070637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,1,balanced,1.8531413078308105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,1,balanced,1.8897333145141602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,1,power_law_1.2,40.62504272460937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,1,balanced,1.9099574089050293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,1,balanced,10.661712010701498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,1,balanced,1.9283092816670735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,1,balanced,1.9711839358011882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,1,balanced,2.082848072052002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,1,balanced,2.074570655822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,1,balanced,0.16582399606704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,1,balanced,10.562906901041666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,1,balanced,3.064101219177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,1,balanced,0.24212799469629923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,1,power_law_1.01,0.22276480197906495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,1,balanced,0.41553600629170734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,1,balanced,2.3124106725056968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,1,power_law_1.01,0.1391487956047058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,1,balanced,0.7629173596700033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,1,power_law_1.01,0.3416703939437866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,1,balanced,4.199605305989583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,1,power_law_1.01,0.18723200559616088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,1,balanced,1.4456532796223958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,1,power_law_1.01,0.5637695789337158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,1,power_law_1.01,0.2849728107452393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,1,balanced,1.8020000457763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,1,power_law_1.01,1.0445119857788085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,1,balanced,3.1780214309692383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,1,power_law_1.01,0.5030079841613769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,1,balanced,1.8083465894063313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,1,balanced,16.017903645833332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,1,power_law_1.01,1.4142208099365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,1,power_law_1.01,0.7369408130645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,1,balanced,1.8166507085164387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,1,power_law_1.01,2.528851127624512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,1,power_law_1.01,1.382528018951416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,1,balanced,1.8257333437601726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,1,power_law_1.01,2.772185516357422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,1,balanced,5.761333465576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,1,power_law_1.01,1.4539263725280762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,1,balanced,1.8330186208089192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,1,power_law_1.01,2.942630386352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,1,balanced,1.8528745969136555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,1,power_law_1.01,1.4992128372192384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,1,power_law_1.01,3.014022445678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,1,balanced,1.8715359369913738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,1,power_law_1.01,1.5919808387756347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,1,balanced,1.88919464747111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,1,power_law_1.01,3.082259178161621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,1,power_law_1.01,1.6304767608642579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,1,balanced,5.983397165934245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,1,balanced,1.9285653432210286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,1,power_law_1.01,1.6348159790039063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,1,power_law_1.01,3.1003904342651367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,1,balanced,24.095807393391926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,1,balanced,1.977509339650472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,1,power_law_1.01,1.7038591384887696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,1,power_law_1.01,3.2421375274658204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,1,power_law_1.01,1.7355840682983399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,1,power_law_1.01,3.2943870544433596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,1,power_law_1.01,1.7411327362060547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,1,power_law_1.01,3.4766464233398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,1,balanced,8.89195187886556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,1,power_law_1.01,1.8784320831298829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,1,balanced,2.029226620992025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,1,power_law_1.01,3.7369537353515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,1,power_law_1.01,1.9348224639892577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,1,power_law_1.01,3.829600143432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,1,power_law_1.01,2.005574417114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,1,power_law_1.01,3.782649612426758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,1,power_law_1.01,2.2590784072875976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,1,power_law_1.01,4.119993591308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,1,power_law_1.01,0.1690559983253479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,1,balanced,2.118096033732096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,1,power_law_1.01,2.497727966308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,1,balanced,22.757334391276043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,1,power_law_1.01,5.098342514038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,1,power_law_1.01,0.23248000144958497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,1,balanced,11.071914672851562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,1,power_law_1.01,2.894623947143555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,1,power_law_1.01,0.32419838905334475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,1,power_law_1.01,6.345619201660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,1,power_law_1.01,0.5586431980133056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,1,power_law_1.01,3.265875244140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,1,power_law_1.01,6.677734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,1,power_law_1.01,0.7802624225616455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,1,power_law_1.01,3.986783981323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,1,power_law_1.01,1.388435173034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,1,power_law_1.01,8.292205047607421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,1,power_law_1.01,4.530771255493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,1,power_law_1.01,1.4847359657287598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,1,power_law_1.01,8.298310089111329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,1,power_law_1.01,5.687788772583008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,1,power_law_1.01,1.5623295783996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,1,balanced,2.3115893999735513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,1,power_law_1.01,10.268172454833984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,1,power_law_1.01,1.6302976608276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,1,power_law_1.01,6.8172607421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,1,balanced,2.4650932947794595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,1,balanced,12.56112543741862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,1,power_law_1.01,1.643903923034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,1,power_law_1.01,12.265631866455077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,1,power_law_1.01,9.184486389160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,1,balanced,2.8463573455810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,1,power_law_1.01,1.776812744140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,1,power_law_1.01,1.906662368774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,1,power_law_1.2,0.22451200485229492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,1,power_law_1.01,11.134528350830077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,1,power_law_1.01,16.22380828857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,1,balanced,3.1388587951660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,1,power_law_1.01,2.0105024337768556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,1,power_law_1.2,0.24841599464416503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,1,power_law_1.01,13.793055725097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,1,power_law_1.01,2.2745344161987306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,1,power_law_1.2,0.49836158752441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,1,power_law_1.01,21.837107849121093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,1,balanced,4.939546585083008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,1,balanced,38.68295542399088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,1,power_law_1.2,0.8659071922302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,1,power_law_1.01,2.438483238220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,1,power_law_1.2,1.2382335662841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,1,power_law_1.01,21.113702392578126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,1,power_law_1.01,26.000698852539063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,1,balanced,5.628719965616862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,1,power_law_1.2,2.532486343383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,1,power_law_1.01,2.327436828613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,1,power_law_1.2,2.7258111953735353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,1,power_law_1.2,2.910086441040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,1,power_law_1.01,40.521209716796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,1,power_law_1.01,38.07338256835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,1,power_law_1.01,2.531609535217285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,1,power_law_1.2,3.028883171081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,1,balanced,8.415445327758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,1,balanced,20.601370493570965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,1,power_law_1.2,3.1413951873779298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,1,power_law_1.2,3.2892608642578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,1,power_law_1.01,2.5813056945800783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,1,power_law_1.2,3.3867774963378907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.01,2.9434303283691405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,1,balanced,11.39291254679362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,1,power_law_1.2,3.430003356933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,1,power_law_1.01,70.09149169921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.01,3.237235260009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,1,power_law_1.2,3.67217903137207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.01,3.814566421508789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,1,power_law_1.2,3.7878528594970704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.01,4.970105743408203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,1,power_law_1.2,3.955596923828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.01,6.181734466552735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,1,power_law_1.2,3.871744155883789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,1,balanced,16.204437255859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.01,8.692479705810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,1,power_law_1.2,4.3859710693359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,1,power_law_1.2,5.319718551635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.01,11.264262390136718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,1,power_law_1.2,6.5333503723144535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.01,16.475628662109376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,1,power_law_1.2,6.984352111816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,1,power_law_1.2,8.437165069580079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.01,21.772665405273436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,1,balanced,22.3218994140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,1,power_law_1.2,8.648051452636718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,1,power_law_1.01,27.19928894042969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,1,power_law_1.2,10.535417938232422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,1,balanced,68.46870930989583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,1,power_law_1.2,12.631289672851562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,1,power_law_1.01,43.67814331054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,1,power_law_1.2,16.663174438476563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,1,power_law_1.2,0.14001920223236083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,1,balanced,39.64824422200521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,1,power_law_1.2,21.69075164794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,1,power_law_1.2,0.15205119848251342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,1,balanced,26.88989766438802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,1,power_law_1.2,0.28705921173095705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,1,power_law_1.2,0.45720319747924804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,1,power_law_1.2,25.764923095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,1,power_law_1.01,89.58682861328126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,1,power_law_1.2,0.6433472156524658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,1,power_law_1.2,1.3277055740356445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,1,power_law_1.2,1.4514176368713378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,1,power_law_1.2,37.30522766113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,1,power_law_1.2,1.5575743675231934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,1,power_law_1.2,1.6239871978759766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,1,power_law_1.2,1.5972160339355468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,1,power_law_1.2,1.66046085357666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,1,power_law_1.2,70.46732177734376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,1,power_law_1.2,1.7446847915649415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,1,power_law_1.2,1.7985088348388671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,1,power_law_1.2,1.8541759490966796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,1,balanced,44.6511484781901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,1,power_law_1.2,1.902560043334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,1,power_law_1.2,1.971583938598633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,1,power_law_1.2,2.0731327056884767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,1,power_law_1.2,2.31845760345459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,1,power_law_1.2,2.5029375076293947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,1,power_law_1.2,3.0259647369384766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,1,power_law_1.2,3.2898494720458986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,1,power_law_1.2,4.055219268798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,1,power_law_1.2,4.629587173461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,1,power_law_1.2,5.773036956787109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,1,power_law_1.2,6.9565376281738285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,1,power_law_1.2,9.307577514648438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,1,power_law_1.2,11.34395523071289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,1,power_law_1.2,13.838092041015624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,1,power_law_1.2,21.04680938720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,1,power_law_1.2,41.671173095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,1,balanced,91.83575439453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,1,power_law_1.2,0.16883840560913085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,1,power_law_1.2,0.1815551996231079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,1,power_law_1.2,0.2973759889602661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,1,power_law_1.2,0.49504637718200684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,1,power_law_1.2,0.6678656101226806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,1,balanced,0.22503999869028726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,1,power_law_1.2,1.3833215713500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,1,power_law_1.2,1.4718015670776368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,1,balanced,0.36212265491485596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,1,balanced,0.682698647181193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,1,power_law_1.2,1.5728639602661132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,1,balanced,1.3462665875752766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,1,power_law_1.2,1.6272384643554687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,1,balanced,2.6277759869893393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,1,power_law_1.2,1.7738687515258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,1,balanced,5.161722819010417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,1,power_law_1.2,1.8603071212768554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,1,balanced,7.775381088256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,1,power_law_1.2,2.024710464477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,1,balanced,7.75331179300944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,1,power_law_1.2,2.1271488189697267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,1,balanced,7.791685104370117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,1,power_law_1.2,2.295430374145508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,1,balanced,7.759925206502278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,1,power_law_1.2,2.5121152877807615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,1,balanced,7.85371208190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,1,balanced,7.842010498046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,1,balanced,0.13537066181500754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,1,power_law_1.2,2.396447944641113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,1,balanced,7.854677200317383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,1,balanced,0.2056480050086975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,1,balanced,0.3676160176595052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,1,balanced,0.6943413416544596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,1,balanced,7.837242762247722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,1,power_law_1.2,2.559846305847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,1,balanced,1.349013328552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,1,balanced,2.6309760411580405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,1,balanced,7.902320226033528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,1,balanced,3.895893414815267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,1,balanced,3.942981402079264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,1,power_law_1.2,2.695430374145508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,1,balanced,7.883583704630534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,1,power_law_1.01,0.22536959648132324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,1,balanced,3.9410934448242188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.2,3.0397056579589843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,1,balanced,3.9637492497762046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,1,balanced,7.953151702880859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,1,power_law_1.01,0.3625407934188843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,1,balanced,3.953536033630371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,1,balanced,0.21331199010213217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.2,3.380691146850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,1,power_law_1.01,0.6769152164459229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,1,balanced,8.052768071492514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,1,balanced,3.97705078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,1,balanced,0.28140799204508465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.2,3.92674560546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,1,power_law_1.01,0.9282112121582031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,1,balanced,0.42369600137074787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,1,balanced,4.015445391337077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,1,balanced,8.286981582641602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,1,balanced,0.7446933587392172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.2,5.125215911865235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,1,balanced,4.044949213663737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,1,power_law_1.01,1.9508096694946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,1,balanced,1.3876214027404785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,1,balanced,4.090053240458171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,1,balanced,8.510554631551107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.2,6.322425460815429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,1,power_law_1.01,0.13600640296936034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,1,balanced,2.6719627380371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,1,balanced,4.122890790303548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,1,power_law_1.01,0.20522239208221435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,1,balanced,3.9483839670817056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.2,8.73864974975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,1,power_law_1.01,2.9635391235351562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,1,balanced,4.195861180623372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,1,balanced,8.725584030151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,1,balanced,3.959797223409017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,1,power_law_1.01,0.36516480445861815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,1,balanced,4.270917256673177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.2,11.256639862060547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,1,balanced,3.969461441040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,1,power_law_1.01,3.4393280029296873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,1,power_law_1.01,0.4463871955871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,1,balanced,4.3220265706380205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,1,balanced,9.083226521809896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,1,balanced,3.9813226064046225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,1,power_law_1.01,0.9819711685180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,1,balanced,4.484442710876465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.2,16.366648864746093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,1,power_law_1.01,4.647673416137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,1,balanced,3.9976425170898438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,1,power_law_1.01,1.4750335693359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,1,balanced,4.67631467183431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,1,balanced,9.563738505045572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,1,balanced,4.017141342163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.2,21.337298583984374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,1,power_law_1.01,1.7933439254760741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,1,power_law_1.01,4.989491271972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,1,balanced,4.040010770161946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,1,balanced,4.950906753540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,1,power_law_1.01,2.4182144165039063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,1,power_law_1.01,5.195552062988281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,1,balanced,4.082634607950847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,1,power_law_1.01,2.519481658935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,1,power_law_1.2,26.482196044921874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,1,balanced,5.163306554158528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,1,balanced,10.252037048339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,1,balanced,4.134138743082683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,1,power_law_1.01,5.403564834594727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,1,power_law_1.01,2.7097471237182615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,1,balanced,4.180266698201497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,1,power_law_1.01,2.848851203918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,1,balanced,5.727024078369141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,1,power_law_1.01,5.569190216064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,1,power_law_1.2,42.677490234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,1,balanced,4.273290634155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,1,balanced,12.041605631510416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,1,power_law_1.01,2.9392831802368162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,1,power_law_1.01,5.754655838012695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,1,balanced,4.476645469665527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,1,power_law_1.01,3.0482559204101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,1,balanced,7.0517120361328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,1,power_law_1.01,5.984716796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,1,power_law_1.01,3.271865463256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,1,power_law_1.01,6.190796661376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,1,power_law_1.01,3.485055923461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,1,power_law_1.2,86.13829956054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,1,power_law_1.01,6.359916687011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,1,balanced,4.656869252522786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,1,power_law_1.01,3.7642303466796876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,1,balanced,13.020299275716146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,1,power_law_1.01,6.759238433837891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,1,power_law_1.01,3.4888256072998045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,1,balanced,7.999909083048503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,1,power_law_1.01,3.7802047729492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,1,power_law_1.01,7.286278533935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,1,power_law_1.01,4.559532928466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,1,power_law_1.01,9.343154907226562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,1,power_law_1.01,5.408211135864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,1,balanced,5.048704147338867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,1,power_law_1.01,11.33543701171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,1,power_law_1.01,5.1934974670410154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,1,balanced,18.319615681966145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,1,power_law_1.01,10.636934661865235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,1,balanced,11.04196294148763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,1,balanced,5.389973322550456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,1,power_law_1.01,6.385055923461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,1,power_law_1.01,5.620499038696289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,1,power_law_1.01,13.076524353027343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,1,balanced,6.036037445068359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,1,power_law_1.01,6.689849853515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,1,power_law_1.01,10.477043151855469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,1,power_law_1.01,9.099359893798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,1,balanced,7.093568166097005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,1,power_law_1.01,12.682380676269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,1,power_law_1.2,0.22602241039276122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,1,power_law_1.01,11.496205139160157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,1,power_law_1.2,0.3628671884536743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,1,power_law_1.01,0.22398080825805664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,1,power_law_1.01,16.027020263671876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,1,balanced,14.592549641927084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,1,power_law_1.2,0.4963071823120117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,1,balanced,26.488352457682293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,1,balanced,8.290229161580404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,1,power_law_1.01,12.486297607421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,1,power_law_1.01,0.29894399642944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,1,power_law_1.2,0.8611712455749512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,1,power_law_1.01,20.08831329345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,1,power_law_1.01,0.46097278594970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,1,power_law_1.2,1.653753662109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,1,power_law_1.01,14.758828735351562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,1,power_law_1.01,0.5160768032073975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,1,power_law_1.2,2.404729652404785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,1,power_law_1.01,1.0351807594299316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,1,power_law_1.01,23.439244079589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,1,power_law_1.2,2.9519168853759767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,1,balanced,13.468522389729818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,1,power_law_1.01,23.748728942871093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,1,power_law_1.01,1.5727359771728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,1,power_law_1.2,4.415180969238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,1,power_law_1.01,1.8214591979980468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,1,power_law_1.01,27.46944580078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,1,power_law_1.2,4.6949310302734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,1,power_law_1.01,2.3888576507568358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,1,power_law_1.2,4.90142707824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,1,power_law_1.01,41.399603271484374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,1,power_law_1.01,2.5624704360961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,1,power_law_1.2,5.3434814453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,1,power_law_1.01,2.7332096099853516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,1,balanced,16.46713129679362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,1,power_law_1.01,39.2554443359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,1,power_law_1.01,2.770809555053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,1,power_law_1.2,5.574259185791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,1,balanced,21.348495483398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,1,power_law_1.01,2.992723274230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,1,power_law_1.2,5.781689453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,1,balanced,35.82184600830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,1,power_law_1.01,3.138796806335449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,1,power_law_1.2,5.982534408569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,1,power_law_1.01,3.4836799621582033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,1,power_law_1.2,6.145363235473633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,1,power_law_1.01,70.01739501953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,1,power_law_1.01,3.7035137176513673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,1,power_law_1.2,6.227987289428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,1,power_law_1.01,3.948223876953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,1,balanced,24.10084279378255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,1,power_law_1.2,6.751487731933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,1,power_law_1.01,4.476224136352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,1,power_law_1.2,7.53095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,1,power_law_1.01,5.488883209228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,1,power_law_1.2,9.519891357421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.01,5.338809585571289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,1,power_law_1.2,11.477279663085938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,1,power_law_1.2,11.370796966552735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.01,5.193119812011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,1,power_law_1.2,14.07352294921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.01,6.039859390258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,1,balanced,32.068196614583336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,1,power_law_1.2,11.179424285888672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.01,7.679360198974609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.01,7.99438705444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,1,power_law_1.2,13.355775451660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.01,10.625107574462891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,1,power_law_1.2,17.385491943359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.01,13.278022766113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,1,power_law_1.2,21.041261291503908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.01,18.911744689941408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,1,balanced,41.84927876790365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,1,power_law_1.2,24.152281188964842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.01,24.479373168945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,1,balanced,67.87986755371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,1,power_law_1.2,28.602200317382813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,1,power_law_1.01,30.230322265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,1,balanced,49.849456787109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,1,power_law_1.2,40.89927673339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,1,power_law_1.01,47.5465087890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,1,power_law_1.2,71.22377319335938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,1,power_law_1.2,0.1358464002609253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,1,power_law_1.01,95.28876342773438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,1,power_law_1.2,0.20655360221862792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,1,power_law_1.2,0.27457919120788576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,1,power_law_1.2,0.4944320201873779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,1,power_law_1.2,0.8759552001953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,1,power_law_1.2,1.3118144035339356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,1,power_law_1.2,1.5480256080627441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,1,power_law_1.2,2.270252799987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,1,power_law_1.2,2.46942081451416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,1,power_law_1.2,2.562041664123535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,1,power_law_1.2,2.7600896835327147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,1,power_law_1.2,2.8103103637695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,1,power_law_1.2,2.91473274230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,1,power_law_1.2,3.495859146118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,1,power_law_1.2,3.7105152130126955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,1,power_law_1.2,3.8633342742919923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,1,balanced,98.08545939127605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,1,power_law_1.2,3.614316940307617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,1,power_law_1.2,4.074272155761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,1,power_law_1.2,4.821881484985352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,1,power_law_1.2,5.7653953552246096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,1,power_law_1.2,5.654451370239258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,1,power_law_1.2,7.042393493652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,1,power_law_1.2,5.981472015380859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,1,power_law_1.2,0.2185920000076294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,1,power_law_1.2,7.2371070861816404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,1,power_law_1.2,0.2989311933517456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,1,power_law_1.2,9.764991760253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,1,power_law_1.2,0.3563584089279175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,1,power_law_1.2,0.5356800079345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,1,power_law_1.2,12.143590545654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,1,power_law_1.2,0.8966015815734864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,1,power_law_1.2,1.34335355758667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,1,power_law_1.2,13.117561340332031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,1,power_law_1.2,1.5748479843139649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,1,power_law_1.2,15.670252990722656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,1,power_law_1.2,2.326534461975098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,1,power_law_1.2,2.343008041381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,1,power_law_1.2,24.29174346923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,1,power_law_1.2,2.569503974914551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,1,power_law_1.2,2.78353271484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,1,power_law_1.2,2.9236799240112306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,1,power_law_1.2,41.79473876953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,1,power_law_1.2,3.109452819824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,1,power_law_1.2,3.4894527435302733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,1,power_law_1.2,3.732819366455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,1,balanced,0.09954667091369629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,1,power_law_1.01,0.10003839731216431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,1,power_law_1.2,4.021836853027343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,1,power_law_1.2,0.10016000270843506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,1,power_law_1.2,4.547404861450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,1,power_law_1.2,5.473471832275391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.2,5.477753448486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,1,balanced,0.12470400333404541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,1,power_law_1.01,0.1211583971977234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,1,power_law_1.2,0.12055679559707641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.2,5.329126358032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,1,power_law_1.2,0.14862719774246216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,1,balanced,0.1856373349825541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,1,power_law_1.01,0.14566400051116943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.2,6.206764984130859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.2,7.987776184082032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,1,power_law_1.2,0.161190402507782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,1,balanced,0.20919466018676758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,1,power_law_1.01,0.15649919509887694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.2,8.498560333251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,1,balanced,0.09761599699656169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,1,power_law_1.01,0.09740800261497498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.2,10.961241912841796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.2,13.579808044433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,1,balanced,0.12484799822171529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,1,power_law_1.01,0.1126911997795105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.2,18.917088317871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,1,power_law_1.2,0.19050240516662598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,1,balanced,0.3120693365732829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,1,power_law_1.01,0.20836479663848878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,1,power_law_1.2,0.25633280277252196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,1,balanced,0.5833119948705038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,1,balanced,0.1806079943974813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,1,power_law_1.01,0.28786559104919435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,1,power_law_1.01,0.13276159763336182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.2,24.339859008789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,1,power_law_1.2,29.722573852539064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,1,balanced,0.20430399974187216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,1,power_law_1.01,0.11122560501098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,1,power_law_1.2,0.09689599871635438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,1,power_law_1.2,0.3890496015548706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,1,balanced,0.5851039886474609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,1,power_law_1.2,0.10905599594116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,1,power_law_1.01,0.38676478862762453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,1,power_law_1.2,0.4032639980316162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,1,balanced,0.5879413286844889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,1,power_law_1.2,0.1356927990913391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,1,power_law_1.01,0.43228797912597655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,1,power_law_1.2,46.58570861816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,1,balanced,0.17427200078964233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,1,power_law_1.2,0.10103039741516114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,1,power_law_1.01,0.16500480175018312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,1,balanced,0.17470399538675943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,1,power_law_1.2,0.16832000017166138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,1,power_law_1.01,0.16654720306396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,1,power_law_1.2,0.4538303852081299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,1,power_law_1.2,0.1668352007865906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,1,balanced,0.5861813227335612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,1,power_law_1.01,0.440172815322876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,1,power_law_1.2,0.4623424053192139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,1,balanced,0.1750026742617289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,1,power_law_1.2,0.19100799560546874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,1,balanced,0.5870399872461954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,1,power_law_1.01,0.1927616000175476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,1,power_law_1.01,0.4410880088806152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,1,balanced,0.1745013395945231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,1,power_law_1.2,0.19612159729003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,1,power_law_1.01,0.19667840003967285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,1,power_law_1.2,92.92760620117187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,1,balanced,0.17500799894332886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,1,power_law_1.2,0.4954368114471436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,1,power_law_1.2,0.21079039573669434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,1,balanced,0.5872639815012614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,1,power_law_1.01,0.21055359840393068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,1,balanced,0.17614400386810303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,1,power_law_1.2,0.2321471929550171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,1,power_law_1.01,0.4824384212493896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,1,power_law_1.01,0.232422399520874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,1,balanced,0.17586666345596313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,1,power_law_1.2,0.26280319690704346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,1,power_law_1.2,0.540883207321167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,1,power_law_1.01,0.25896320343017576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,1,balanced,0.5872906843821207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,1,power_law_1.01,0.5254848003387451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,1,power_law_1.2,0.5914944171905517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,1,balanced,0.5873813231786092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,1,balanced,0.19979200760523477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,1,power_law_1.2,0.25024640560150146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,1,power_law_1.01,0.2534463882446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,1,power_law_1.01,0.545139217376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,1,power_law_1.2,0.2698048114776611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,1,balanced,0.2005066672960917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,1,power_law_1.2,0.6597119808197022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,1,power_law_1.01,0.2645375967025757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,1,balanced,0.5881760120391846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,2,balanced,0.12098667025566101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,1,power_law_1.2,0.30741760730743406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,1,balanced,0.2023893396059672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,1,power_law_1.01,0.6325695991516114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,2,balanced,0.18652266263961792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,1,power_law_1.01,0.31062400341033936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,2,balanced,0.3522506554921468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,1,power_law_1.2,0.7085951805114746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,2,balanced,0.353002667427063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,1,balanced,0.5897333224614462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,2,balanced,0.352512001991272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,1,power_law_1.01,0.7050176143646241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,2,balanced,0.354912002881368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,2,balanced,0.3560906648635864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,1,power_law_1.2,0.3485503911972046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,1,balanced,0.25835732618967694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,1,power_law_1.01,0.33345279693603513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,1,power_law_1.2,0.7887551784515381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,1,balanced,0.5918293396631876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,2,balanced,0.35816534360249835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,1,power_law_1.01,0.7570432186126709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,2,balanced,0.37307198842366535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,1,power_law_1.2,0.3607039928436279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,1,balanced,0.25890133778254193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,1,power_law_1.01,0.36459519863128664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,2,balanced,0.3752799828847249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,1,power_law_1.2,0.9376128196716309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,2,balanced,0.38496001561482746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,1,balanced,0.5963786840438843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,1,power_law_1.2,0.42207999229431153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,1,balanced,0.2618666688601176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,2,balanced,0.3883519967397054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,1,power_law_1.01,0.423737621307373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,1,power_law_1.01,0.8992192268371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,2,balanced,0.388314684232076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,2,balanced,0.43374931812286377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,1,balanced,0.5366826852162679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,1,power_law_1.2,0.7687551975250244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,1,power_law_1.01,0.7703487873077393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,2,balanced,0.4166346788406372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,2,balanced,0.418448011080424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,1,power_law_1.2,0.8721023559570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,1,power_law_1.01,0.8519935607910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,1,balanced,0.5429493188858032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,1,power_law_1.2,1.0011967658996581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,2,balanced,0.44941866397857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,1,power_law_1.01,0.9370944023132324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,1,balanced,0.7045066356658936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,2,balanced,0.5177280108133951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,2,balanced,0.5413920084635416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,1,power_law_1.2,1.1149824142456055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,1,power_law_1.01,1.1285440444946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,1,balanced,1.0230186780293782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,2,balanced,0.7700213591257731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,1,power_law_1.2,1.154636764526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,1,power_law_1.01,1.081651210784912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,2,balanced,0.9250773588816324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,1,balanced,0.7111199696858724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,1,power_law_1.2,1.3544832229614259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,1,balanced,1.0351040363311768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,1,power_law_1.01,1.3541824340820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,2,balanced,1.3582827250162761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,2,balanced,1.7855839729309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,1,power_law_1.2,1.8510528564453126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,1,power_law_1.01,1.854047966003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,1,balanced,1.5363732973734539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,2,balanced,2.6178132692972818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,1,power_law_1.2,2.3481727600097657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,1,power_law_1.01,2.358188819885254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,1,balanced,2.0327626864115396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,1,power_law_1.2,1.357254409790039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,2,balanced,3.481712023417155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,1,power_law_1.01,1.3071616172790528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,1,balanced,0.9600586891174316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,1,power_law_1.2,3.3018112182617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,1,power_law_1.01,3.3471233367919924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,1,balanced,3.0016746520996094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,2,balanced,5.425957361857097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,1,power_law_1.2,1.5833663940429688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,1,power_law_1.01,1.5281791687011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,1,power_law_1.2,4.284864044189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,1,balanced,3.989013353983561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,1,power_law_1.01,4.302713775634766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,1,balanced,0.9712373415629069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,2,balanced,7.199701309204102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,1,power_law_1.2,3.093631935119629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,1,power_law_1.2,6.221164703369141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,1,power_law_1.01,6.223519897460937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,1,power_law_1.01,2.9281919479370115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,1,balanced,5.958752314249675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,2,balanced,9.124645233154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,1,balanced,2.023573398590088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,1,power_law_1.2,3.574214553833008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,1,power_law_1.2,8.174937438964843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,1,power_law_1.01,8.230944061279297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,1,balanced,2.0557333628336587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,1,power_law_1.01,3.3746814727783203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,1,balanced,7.928581237792969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,2,balanced,0.08428266644477844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,2,balanced,14.790362040201822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,1,power_law_1.2,10.119487762451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,1,power_law_1.01,10.19573745727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,1,power_law_1.2,4.50445442199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,2,balanced,0.11748266220092773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,2,balanced,0.19605332612991333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,1,balanced,3.9377867380777993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,1,power_law_1.01,4.328819274902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,2,balanced,0.2018346587816874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,2,balanced,0.20004266500473022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,1,power_law_1.2,16.107437133789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,2,balanced,0.20159467061360678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,1,power_law_1.01,16.125433349609374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,1,balanced,9.909354527791342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,1,power_law_1.2,5.501068878173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,2,balanced,0.20193066199620566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,1,balanced,4.002645174662272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,2,balanced,0.2071146567662557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,1,power_law_1.01,5.232787322998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,2,balanced,0.20617600282033285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,1,power_law_1.2,32.38160095214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,2,balanced,0.20909865697224936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,1,power_law_1.01,32.202392578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,2,balanced,0.21373866001764932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,1,balanced,5.948127746582031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,1,power_law_1.2,7.444844818115234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,2,balanced,29.5293706258138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,2,balanced,0.21374932924906412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,2,balanced,0.21567465861638388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,1,power_law_1.01,7.281574249267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,2,balanced,0.23104000091552734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,2,balanced,0.25117866198221844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,1,balanced,15.778106689453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,1,power_law_1.2,9.37557144165039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,1,balanced,7.921328226725261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,2,balanced,0.25306133429209393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,2,balanced,0.269487996896108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,2,balanced,0.3298773368199666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,1,power_law_1.01,9.237996673583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,2,balanced,0.33630398909250897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,1,power_law_1.2,11.294009399414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,1,power_law_1.01,11.241632080078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,2,balanced,0.4703199863433838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,1,balanced,9.910613377888998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,2,balanced,0.5665706793467203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,2,balanced,0.8186559677124023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,2,balanced,1.0846186478932698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,1,power_law_1.2,17.420025634765626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,1,power_law_1.01,17.2727294921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,2,balanced,1.5767839749654133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,1,power_law_1.2,33.36064758300781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,2,balanced,2.174352010091146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,1,power_law_1.01,33.31253662109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,1,balanced,16.035722096761067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,1,balanced,32.08960978190104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,2,balanced,3.221109390258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,2,balanced,4.096255938212077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,2,balanced,5.077712059020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,2,balanced,8.574533462524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,1,balanced,31.92017110188802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,2,balanced,16.94806416829427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,2,power_law_1.01,0.1863935947418213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,2,power_law_1.01,0.2045504093170166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,2,power_law_1.01,0.10908160209655762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,2,power_law_1.01,0.2537856101989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,2,power_law_1.01,0.10187519788742065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,2,power_law_1.01,0.3206655979156494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,2,power_law_1.01,0.1649216055870056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,2,power_law_1.01,0.3521087884902954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,2,power_law_1.01,0.20083200931549072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,2,power_law_1.01,0.37781760692596433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,2,power_law_1.01,0.1992319941520691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,2,balanced,0.07425066828727722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,2,power_law_1.01,0.39688959121704104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,2,power_law_1.01,0.21465599536895752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,2,balanced,0.11428800225257874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,2,power_law_1.01,0.4314112186431885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,2,power_law_1.01,0.22323839664459227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,2,balanced,0.19325333833694458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,2,power_law_1.01,0.47876482009887694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,2,power_law_1.01,0.22700159549713134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,2,balanced,0.1957599918047587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,2,power_law_1.01,0.4993855953216553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,2,power_law_1.01,0.24017279148101806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,2,balanced,0.1991573373476664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,2,power_law_1.01,0.45967998504638674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,2,power_law_1.01,0.24690558910369872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,2,balanced,0.2000160018603007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,2,power_law_1.01,0.47562241554260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,2,power_law_1.01,0.2344127893447876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,2,balanced,0.20266133546829224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,2,power_law_1.01,0.11381759643554687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,2,power_law_1.01,0.5095295906066895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,2,power_law_1.01,0.2521215915679932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,2,balanced,0.20306134223937988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,2,power_law_1.01,0.5259136199951172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,2,power_law_1.01,0.13941119909286498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,2,power_law_1.01,0.2748863935470581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,2,power_law_1.01,0.14063359498977662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,2,power_law_1.01,0.5551167964935303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,2,power_law_1.01,0.17485439777374268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,2,power_law_1.01,0.3024319887161255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,2,power_law_1.01,0.19127680063247682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,2,power_law_1.01,0.5898431777954102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,2,power_law_1.01,0.3577023983001709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,2,power_law_1.01,0.20941441059112548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,2,power_law_1.01,0.5611519813537598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,2,power_law_1.01,0.3848896026611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,2,power_law_1.01,0.24917759895324706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,2,power_law_1.01,0.26720640659332273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,2,power_law_1.01,0.34603519439697267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,2,balanced,0.2060533364613851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,2,power_law_1.01,0.7638847827911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,2,power_law_1.01,0.4293248176574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,2,power_law_1.01,0.9549056053161621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,2,balanced,0.20861866076787314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,2,power_law_1.01,0.48427519798278806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,2,power_law_1.01,0.25220479965209963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,2,power_law_1.01,1.157260799407959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,2,power_law_1.2,0.15860480070114136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,2,power_law_1.01,0.7770112037658692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,2,power_law_1.01,0.2632319927215576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,2,power_law_1.2,0.11028480529785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,2,power_law_1.01,1.4895999908447266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,2,power_law_1.01,1.0108287811279297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,2,power_law_1.2,0.2022847890853882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,2,power_law_1.2,0.12570879459381104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,2,power_law_1.01,2.085203170776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,2,power_law_1.2,0.27063679695129395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,2,power_law_1.01,1.3865663528442382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,2,power_law_1.2,0.35290238857269285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,2,power_law_1.2,0.13338880538940429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,2,power_law_1.01,2.756025505065918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,2,power_law_1.01,1.6075199127197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,2,power_law_1.2,0.35155839920043946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,2,power_law_1.2,0.19987839460372925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,2,power_law_1.2,0.37982079982757566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,2,power_law_1.01,2.622323226928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,2,power_law_1.01,4.813068771362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,2,balanced,0.2172000010808309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,2,power_law_1.2,0.18670079708099366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,2,power_law_1.2,0.4000063896179199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,2,power_law_1.01,0.259935998916626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,2,power_law_1.01,3.0145151138305666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,2,power_law_1.2,0.43511037826538085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,2,power_law_1.01,5.260812759399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,2,balanced,0.22099733352661133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,2,power_law_1.2,0.21108479499816896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,2,power_law_1.2,0.4983359813690186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,2,power_law_1.01,0.27319040298461916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,2,power_law_1.01,5.499193572998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,2,power_law_1.2,0.22997119426727294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,2,balanced,0.22694933414459229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,2,power_law_1.01,8.240582275390626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,2,power_law_1.2,0.533951997756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,2,power_law_1.01,0.2882368087768555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,2,balanced,0.2315946618715922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,2,power_law_1.2,0.2315648078918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,2,power_law_1.2,0.4493760108947754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,2,power_law_1.01,7.582431793212891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,2,power_law_1.01,0.30037119388580324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,2,power_law_1.2,0.4941567897796631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,2,balanced,0.25998934110005695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,2,power_law_1.01,13.259347534179687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,2,power_law_1.2,0.23685119152069092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,2,power_law_1.01,0.3473151922225952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,2,power_law_1.01,8.508460998535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,2,power_law_1.2,0.4831232070922852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,2,balanced,0.2680160005887349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,2,power_law_1.2,0.24801919460296631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,2,power_law_1.01,0.3655872106552124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,2,power_law_1.2,0.5142975807189941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,2,power_law_1.01,14.146310424804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,2,balanced,0.2805759906768799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,2,power_law_1.2,0.24476161003112792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,2,power_law_1.2,0.5484672069549561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,2,power_law_1.01,13.697337341308593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,2,power_law_1.01,0.4494016170501709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,2,power_law_1.2,0.26081280708312987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,2,balanced,0.418997327486674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,2,power_law_1.2,0.5537471771240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,2,power_law_1.01,0.6826816082000733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,2,power_law_1.2,0.10561280250549317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,2,power_law_1.2,0.2664128065109253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,2,power_law_1.2,0.6406015872955322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,2,balanced,0.45258665084838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,2,power_law_1.01,24.11961669921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,2,power_law_1.01,0.7347904205322265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,2,power_law_1.01,26.76331481933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,2,power_law_1.2,0.12349439859390259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,2,power_law_1.2,0.3280064105987549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,2,power_law_1.2,0.8234687805175781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,2,balanced,0.6607253154118856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,2,power_law_1.01,1.1451968193054198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,2,power_law_1.2,0.14852479696273804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,2,power_law_1.2,0.3682559967041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,2,power_law_1.01,1.1850943565368652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,2,power_law_1.2,0.9428031921386719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,2,balanced,0.8885546525319418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,1,balanced,0.11664000153541565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,2,power_law_1.2,0.1961856007575989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,2,power_law_1.01,2.279532814025879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,2,power_law_1.2,0.4164480209350586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,2,power_law_1.2,1.5873920440673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,2,power_law_1.01,46.75650634765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,2,balanced,1.3272426923116047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,2,power_law_1.2,0.34351999759674073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,2,power_law_1.01,2.759391975402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,2,power_law_1.2,1.5400704383850097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,2,power_law_1.2,0.19776639938354493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,1,balanced,0.18573866287867227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,2,power_law_1.2,0.22855041027069092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,2,power_law_1.2,2.1644351959228514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,2,power_law_1.2,0.47148799896240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,2,power_law_1.01,3.9530624389648437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,1,balanced,0.34745601812998456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,2,balanced,1.7775786717732747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,2,power_law_1.2,0.24366719722747804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,2,power_law_1.2,3.062630462646484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,2,power_law_1.2,0.501094388961792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,1,balanced,0.35145068168640137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,2,power_law_1.01,5.633216094970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,2,balanced,2.6681226094563804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,2,power_law_1.2,4.252358245849609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,2,power_law_1.2,0.26584959030151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,1,balanced,0.353434681892395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,2,power_law_1.2,0.7384448051452637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,2,power_law_1.01,8.615814208984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,2,power_law_1.2,6.38719367980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,1,balanced,0.3549013137817383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,2,power_law_1.2,0.9313728332519531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,2,balanced,3.5303093592325845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,2,power_law_1.01,9.40887680053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,1,balanced,0.3574399948120117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,2,power_law_1.2,1.261567974090576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,2,power_law_1.2,9.30228500366211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,2,power_law_1.2,0.2659519910812378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,1,balanced,0.3633066813151042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,2,power_law_1.01,13.004794311523437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,2,power_law_1.2,1.818124771118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,2,power_law_1.2,0.26578559875488283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,2,balanced,5.301733334859212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,2,power_law_1.2,13.914349365234376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,1,balanced,0.36642134189605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,2,power_law_1.2,2.503763198852539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,1,balanced,0.3691840171813965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,2,power_law_1.01,20.64110107421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,2,power_law_1.2,15.638067626953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,2,power_law_1.2,3.874105453491211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,2,power_law_1.2,0.26924159526824953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,1,balanced,0.3786826531092326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,2,balanced,7.037600199381511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,2,power_law_1.2,0.28254721164703367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,2,power_law_1.2,5.322278213500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,1,balanced,0.3770879904429118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,2,power_law_1.2,25.825146484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,2,power_law_1.2,0.2924288034439087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,1,balanced,0.37967999776204425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,2,power_law_1.2,6.171859359741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,2,power_law_1.2,0.319648003578186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,1,balanced,0.4158133268356323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,2,power_law_1.01,56.6102783203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,2,balanced,8.836885452270508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,2,power_law_1.2,0.33194239139556886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,1,balanced,0.4233333269755046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,2,power_law_1.2,9.26202850341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,2,power_law_1.2,0.35909759998321533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,1,balanced,0.4257173140843709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,2,power_law_1.2,52.40989379882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,2,power_law_1.2,0.4335487842559814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,2,power_law_1.2,16.189543151855467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,1,balanced,0.48263466358184814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,2,power_law_1.2,0.6126399993896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,1,balanced,0.528058648109436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,2,power_law_1.2,0.7966207981109619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,2,balanced,14.354255676269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,1,balanced,0.5445866584777832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,2,power_law_1.2,1.0928447723388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,2,power_law_1.2,32.8361083984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,1,balanced,0.7648213704427084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,2,power_law_1.2,1.5696191787719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,1,balanced,0.954416036605835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,2,power_law_1.2,2.3607744216918944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,2,power_law_1.2,2.909145545959473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,1,balanced,1.4008746147155762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,2,power_law_1.2,3.7589439392089843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,1,balanced,1.8387734095255535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,2,power_law_1.2,6.253228759765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,1,balanced,2.6984427769978843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,2,balanced,30.336100260416668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,2,power_law_1.2,8.280319976806641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,1,balanced,3.5801121393839517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,2,power_law_1.2,12.396230316162109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,1,balanced,5.443605422973633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,2,power_law_1.2,15.073817443847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,1,balanced,7.394005457560222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,2,power_law_1.2,23.31098175048828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,1,balanced,9.149279912312826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,2,power_law_1.2,52.25140380859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,1,balanced,14.941637674967447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,1,balanced,29.6101557413737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,1,balanced,0.07881600161393483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,1,balanced,0.114464004834493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,1,balanced,0.19268266359965006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,1,balanced,0.19700799385706583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,1,balanced,0.19820799430211386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,1,balanced,0.19992534319559732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,1,balanced,0.2039466698964437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,1,balanced,0.2079733411471049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,1,balanced,0.06958933174610138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,1,balanced,0.20908800760904947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,1,balanced,0.11103467146555583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,1,balanced,0.21215466658274332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,1,balanced,0.19083199898401895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,1,balanced,0.21175465981165567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,1,balanced,0.19486933946609497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,1,balanced,0.21382399400075278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,1,power_law_1.01,0.10364799499511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,1,balanced,0.21701333920160928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,1,balanced,0.19707733392715454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,1,balanced,0.23718400796254477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,1,power_law_1.01,0.14342399835586547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,1,balanced,0.1994453271230062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,1,power_law_1.01,0.1852031946182251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,1,balanced,0.2465226650238037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,1,balanced,0.2507573366165161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,1,power_law_1.01,0.3509056091308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,1,balanced,0.20187199115753174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,1,balanced,0.2626720070838928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,1,power_law_1.01,0.3348479986190796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,1,balanced,0.20341867208480835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,1,balanced,0.35174934069315594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,1,power_law_1.01,0.3625792026519775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,1,power_law_1.01,0.3765887975692749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,1,balanced,0.3431573311487834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,1,power_law_1.01,0.07333120107650756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,1,power_law_1.01,0.3692352056503296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,1,balanced,0.4745599826176961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,1,power_law_1.01,0.38816640377044676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,1,power_law_1.01,0.08917760252952575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,1,balanced,0.5883146524429321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,1,power_law_1.01,0.3897792100906372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,1,power_law_1.01,0.11131520271301269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,1,balanced,0.20716800292332968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,1,balanced,0.8563253084818522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,1,power_law_1.01,0.4142335891723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,1,power_law_1.01,0.18853759765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,1,balanced,0.21007466316223145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,1,power_law_1.01,0.06885120272636414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,1,power_law_1.01,0.43926401138305665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,1,power_law_1.01,0.19333759546279908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,1,balanced,1.1195092995961506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,1,power_law_1.01,0.44620800018310547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,1,power_law_1.01,0.20623359680175782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,1,power_law_1.01,0.08906239867210389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,1,balanced,1.6274773279825847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,1,power_law_1.01,0.21623680591583253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,1,power_law_1.2,0.10420479774475097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,1,power_law_1.01,0.47706241607666017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,1,power_law_1.01,0.10251519680023194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,1,power_law_1.01,0.21274240016937257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,1,power_law_1.01,0.49681921005249025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,1,power_law_1.2,0.15196800231933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,1,power_law_1.01,0.1856384038925171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,1,balanced,2.147530714670817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,1,power_law_1.01,0.21566081047058105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,1,power_law_1.01,0.5009920120239257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,1,power_law_1.2,0.17768319845199584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,1,power_law_1.01,0.1948032021522522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,1,power_law_1.01,0.21860480308532715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,1,power_law_1.2,0.3500607967376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,1,balanced,0.21964800357818604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,1,power_law_1.01,0.589792013168335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,1,power_law_1.01,0.2093440055847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,1,power_law_1.01,0.23158400058746337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,1,balanced,3.185098648071289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,1,power_law_1.2,0.3431616067886353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,1,power_law_1.01,0.677561616897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,1,power_law_1.01,0.2252351999282837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,1,balanced,0.22553600867589316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,1,power_law_1.01,0.2335103988647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,1,power_law_1.2,0.36674559116363525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,1,balanced,0.23105067014694214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,1,power_law_1.01,0.24972159862518312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,1,power_law_1.01,0.7344448089599609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,1,power_law_1.01,0.25259521007537844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,1,power_law_1.2,0.38105599880218505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,1,balanced,0.2385653257369995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,1,power_law_1.01,0.2786303997039795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,1,power_law_1.01,0.9678079605102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,1,balanced,4.287226676940918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,1,balanced,0.2719200054804484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,1,power_law_1.2,0.3753599882125854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,1,power_law_1.01,0.28859519958496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,1,balanced,0.28097599744796753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,1,power_law_1.01,1.1530688285827637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,1,power_law_1.01,0.2354048013687134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,1,power_law_1.2,0.387225604057312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,1,power_law_1.01,0.29344639778137205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,1,balanced,0.29739199082056683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,1,power_law_1.01,1.604172706604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,1,power_law_1.01,0.3140160083770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,1,power_law_1.01,0.24506239891052245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,1,power_law_1.2,0.39991040229797364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,1,balanced,0.4440426826477051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,1,balanced,5.276501337687175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,1,power_law_1.01,0.3937279939651489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,1,power_law_1.01,2.058444786071777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,1,balanced,0.4863733450571696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,1,power_law_1.2,0.41072640419006345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,1,balanced,0.7146133581797282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,1,power_law_1.01,0.4319808006286621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,1,power_law_1.2,0.42351360321044923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,1,power_law_1.01,2.878463935852051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,1,power_law_1.01,0.23432960510253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,1,balanced,0.9723520278930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,1,power_law_1.01,0.5622591972351074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,1,power_law_1.2,0.4441664218902588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,1,power_law_1.01,3.874796676635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,1,power_law_1.01,0.24968318939208983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,1,power_law_1.01,0.6714879989624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,1,balanced,1.4416693051656086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,1,power_law_1.2,0.48616318702697753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,1,power_law_1.2,0.07382400035858154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,1,balanced,8.506048202514648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,1,power_law_1.01,0.2531647920608521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,1,power_law_1.01,0.9463423728942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,1,power_law_1.2,0.5028543949127198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,1,balanced,1.919365406036377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,1,power_law_1.01,5.7642559051513675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,1,power_law_1.2,0.08517760038375854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,1,power_law_1.01,0.2928447961807251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,1,power_law_1.01,1.2069567680358886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,1,power_law_1.2,0.5070464134216308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,1,balanced,2.875136057535807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,1,power_law_1.2,0.12617599964141846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,1,power_law_1.01,7.601599884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,1,power_law_1.01,0.3055936098098755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,1,power_law_1.01,1.725222396850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,1,power_law_1.2,0.6017727851867676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,1,power_law_1.2,0.1841472029685974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,1,balanced,3.7941548029581704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,1,power_law_1.01,0.32366719245910647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,1,power_law_1.01,2.2303232192993163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,1,power_law_1.01,9.477324676513671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,1,power_law_1.2,0.1923200011253357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,1,power_law_1.2,0.6680960178375244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,1,power_law_1.01,0.37251839637756345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,1,power_law_1.2,0.20275840759277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,1,power_law_1.01,3.238118362426758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,1,power_law_1.2,0.7474880218505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,1,power_law_1.2,0.20963199138641359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,1,balanced,5.688245137532552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,1,power_law_1.01,0.483244800567627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,1,power_law_1.01,15.370547485351562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,1,power_law_1.2,0.9537343978881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,1,power_law_1.01,4.351456069946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,1,power_law_1.2,0.2128511905670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.01,0.6010111808776856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,1,power_law_1.2,1.1459648132324218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,1,power_law_1.01,5.428262329101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,1,power_law_1.2,0.2182080030441284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,1,balanced,17.134240468343098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.01,0.8336704254150391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,1,balanced,7.552757263183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,1,power_law_1.2,1.616819190979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,1,power_law_1.2,0.2157439947128296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,1,power_law_1.01,29.9441162109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,1,power_law_1.01,8.609452819824218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.01,1.070918369293213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,1,power_law_1.2,0.06878079771995545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,1,power_law_1.2,0.22938880920410157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,1,power_law_1.2,2.040934371948242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,1,power_law_1.2,0.2371135950088501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,1,power_law_1.2,0.08107519745826722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.01,1.5486271858215332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,1,power_law_1.2,2.9522560119628904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,1,power_law_1.2,0.09757440090179444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,1,power_law_1.01,17.141030883789064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,1,power_law_1.2,0.24440960884094237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.01,2.016223907470703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,1,balanced,9.462506612141928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,1,power_law_1.2,0.19376640319824218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,1,power_law_1.2,3.8669502258300783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,1,power_law_1.2,0.2729023933410645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,1,power_law_1.2,0.19114240407943725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.01,2.947494316101074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,1,power_law_1.2,0.2168191909790039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,1,power_law_1.2,0.29054720401763917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,1,power_law_1.2,5.797068786621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,1,power_law_1.2,0.2228287935256958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.01,3.8912830352783203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,1,power_law_1.2,0.30357120037078855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,1,power_law_1.2,0.2508671998977661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,1,power_law_1.2,7.580998229980469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,1,power_law_1.2,0.32318720817565916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.01,5.780607986450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,1,power_law_1.2,0.37160959243774416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,1,balanced,15.21679433186849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,1,power_law_1.2,0.236844801902771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,1,power_law_1.2,9.374015808105469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.01,7.672415924072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,1,power_law_1.2,0.4250175952911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,1,power_law_1.2,0.2508415937423706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,1,power_law_1.2,0.5566656112670898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,1,power_law_1.2,15.333261108398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,1,power_law_1.01,9.582041931152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,1,power_law_1.2,0.6949183940887451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,1,power_law_1.2,0.23664000034332275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,1,power_law_1.2,0.250220799446106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,1,power_law_1.2,0.9508864402770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,1,power_law_1.2,29.720596313476562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,1,power_law_1.01,15.2849853515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,1,power_law_1.2,0.25890560150146485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,1,power_law_1.2,1.193017578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,1,power_law_1.2,0.29205119609832764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,1,power_law_1.2,1.7183551788330078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,1,power_law_1.2,0.3095616102218628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,1,power_law_1.2,0.3206655979156494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,1,power_law_1.2,2.2060224533081056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,1,power_law_1.01,31.100442504882814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,1,power_law_1.2,0.3686336040496826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,1,balanced,31.998613993326824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,1,power_law_1.2,0.4870463848114014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,1,power_law_1.2,3.2439041137695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.2,0.6009407997131347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,1,power_law_1.2,4.365375900268555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.2,0.8373632431030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.2,1.066220760345459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,1,power_law_1.2,5.419430541992187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.2,1.5424063682556153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.2,2.014188766479492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,1,power_law_1.2,8.686994934082032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.2,2.9440704345703126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.2,3.859423828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,1,power_law_1.2,17.134431457519533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.2,5.756646347045899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.2,7.659852600097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,1,power_law_1.2,9.547257232666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,1,power_law_1.2,15.292857360839843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,1,power_law_1.2,31.164556884765624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,2,balanced,0.10598400235176086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,2,balanced,0.16781334082285562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,2,balanced,0.1744800011316935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,2,balanced,0.31033066908518475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,2,balanced,0.3115893403689067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,2,balanced,0.5868533452351888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,2,balanced,0.5845226844151815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,2,balanced,0.3168320059776306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,2,power_law_1.01,0.24119679927825927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,2,balanced,0.5818133354187012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,2,balanced,0.3195199966430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,2,power_law_1.01,0.34599039554595945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,2,balanced,0.5825013319651285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,2,balanced,0.3173759977022807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,2,power_law_1.01,0.3819648027420044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,2,balanced,0.5867146650950114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,2,balanced,0.31993599732716876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,2,balanced,0.10969066619873047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,2,balanced,0.5861440102259318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,2,power_law_1.01,0.5375872135162354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,2,balanced,0.3245866696039836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,2,balanced,0.6136800050735474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,2,balanced,0.17404800653457642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,2,power_law_1.01,0.5602943897247314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,2,balanced,0.3280319968859355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,2,balanced,0.6143626769383749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,2,balanced,0.3123626708984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,2,power_law_1.01,0.614412784576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,2,balanced,0.32684799035390216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,2,balanced,0.6250933408737183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,2,balanced,0.3163839975992839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,2,power_law_1.01,0.6350592136383056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,2,power_law_1.01,0.19106559753417968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,2,balanced,0.34348801771799725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,2,balanced,0.6244853337605795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,2,balanced,0.3185439904530843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,2,power_law_1.01,0.626361608505249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,2,balanced,0.3369866609573364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,2,balanced,0.629962682723999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,2,power_law_1.01,0.1617792010307312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,2,balanced,0.3208853403727214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,2,power_law_1.01,0.6633408069610596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,2,balanced,0.3398880163828532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,2,balanced,0.6552746693293253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,2,power_law_1.01,0.1894976019859314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,2,power_law_1.01,0.1509503960609436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,2,balanced,0.3238346576690674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,2,power_law_1.01,0.6855679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,2,balanced,0.36849065621693927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,2,balanced,0.6588480075200399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,2,power_law_1.01,0.3165503978729248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,2,balanced,0.324069341023763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,2,power_law_1.01,0.6814784049987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,2,power_law_1.01,0.1899135947227478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,2,balanced,0.6595946550369263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,2,balanced,0.3740373452504476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,2,power_law_1.01,0.3195136070251465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,2,power_law_1.01,0.7458687782287597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,2,power_law_1.01,0.22315518856048583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,2,balanced,0.6966400146484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,2,balanced,0.3761599858601888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,2,power_law_1.01,0.3274431943893433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,2,power_law_1.01,0.8416704177856446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,2,power_law_1.01,0.3174272060394287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,2,balanced,0.9082079728444418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,2,balanced,0.39053332805633545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,2,power_law_1.01,0.3383039951324463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,2,power_law_1.01,0.7701312065124511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,2,power_law_1.01,0.30792319774627686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,2,balanced,0.9115306536356608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,2,balanced,0.528714656829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,2,balanced,0.33079467217127484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,2,power_law_1.2,0.2874687910079956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,2,power_law_1.01,0.33092479705810546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,2,power_law_1.01,0.9083840370178222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,2,power_law_1.01,0.370195198059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,2,balanced,1.269765297571818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,2,balanced,0.5406026840209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,2,balanced,0.334549347559611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,2,power_law_1.2,0.30789759159088137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,2,power_law_1.01,0.41081600189208983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,2,power_law_1.01,1.0220928192138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,2,balanced,1.528282642364502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,2,power_law_1.01,0.34561278820037844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,2,power_law_1.2,0.3827199935913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,2,balanced,0.7451466719309489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,2,power_law_1.2,0.5827455997467041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,2,power_law_1.01,0.4433023929595947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,2,power_law_1.01,1.0170751571655274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,2,balanced,2.3087573051452637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,2,power_law_1.2,0.5819712162017823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,2,power_law_1.01,0.36579198837280275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,2,balanced,0.8813333511352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,2,power_law_1.2,0.6077184200286865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,2,power_law_1.01,1.2165696144104003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,2,power_law_1.2,0.17624319791793824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,2,power_law_1.2,0.6362815856933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,2,balanced,2.9643306732177734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,2,power_law_1.01,0.3937279939651489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,2,balanced,1.3227360248565674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,2,power_law_1.01,1.5057024002075194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,2,power_law_1.2,0.622976016998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,2,power_law_1.01,0.43543038368225095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,2,power_law_1.2,0.20697600841522218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,2,power_law_1.2,0.6762879848480224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,2,power_law_1.01,0.42709760665893554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,2,power_law_1.01,1.8717567443847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,2,balanced,1.6887466112772624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,2,balanced,4.583162625630696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,2,power_law_1.01,0.45087361335754395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,2,power_law_1.2,0.6764416217803955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,2,power_law_1.2,0.20609920024871825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,2,balanced,0.34034132957458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,2,power_law_1.2,0.7192319869995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,2,power_law_1.01,0.4720895767211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,2,power_law_1.01,2.2374143600463867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,2,power_law_1.2,0.31661438941955566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,2,power_law_1.2,0.8242560386657715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,2,balanced,2.466911951700846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,2,balanced,0.3444639841715495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,2,balanced,5.885477066040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,2,power_law_1.01,0.43941760063171387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,2,power_law_1.2,0.8055487632751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,2,power_law_1.01,4.046131134033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,2,power_law_1.2,0.3195904016494751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,2,power_law_1.01,0.394649600982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,2,power_law_1.2,0.819001579284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,2,balanced,0.35256532828013104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,2,power_law_1.01,0.5636544227600098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,2,power_law_1.2,0.32023038864135744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,2,power_law_1.01,4.356768035888672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,2,power_law_1.2,0.9007935523986816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,2,balanced,3.2702881495157876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,2,power_law_1.01,0.41626877784729005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,2,balanced,0.3595786492029826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,2,power_law_1.2,0.9110976219177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,2,power_law_1.01,0.6012224197387696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,2,balanced,9.229349136352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,2,power_law_1.2,0.3431936025619507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,2,power_law_1.2,1.0132351875305177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,2,power_law_1.01,0.4395008087158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,2,power_law_1.01,8.069522857666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,2,power_law_1.01,0.5853888034820557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,2,power_law_1.2,1.2989376068115235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,2,power_law_1.2,0.3363584041595459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,2,balanced,4.946015993754069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,2,power_law_1.01,0.5473343849182128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,2,power_law_1.2,1.5726719856262208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,2,power_law_1.01,0.7379968166351318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,2,power_law_1.01,8.997618865966796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,2,power_law_1.2,0.36459519863128664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,2,power_law_1.2,2.00314884185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,2,balanced,12.406501770019531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,2,balanced,0.392959992090861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,2,power_law_1.01,0.8516415596008301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,2,power_law_1.2,2.4862464904785155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,2,power_law_1.01,0.5087935924530029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,2,power_law_1.2,0.36625919342041013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,2,power_law_1.01,12.121024322509765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,2,balanced,0.4014879862467448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,2,power_law_1.2,4.081804656982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,2,balanced,6.47047487894694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,2,power_law_1.01,1.1784959793090821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,2,power_law_1.2,0.38144640922546386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,2,power_law_1.01,0.5618495941162109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,2,power_law_1.2,5.127296066284179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,2,balanced,0.4230773448944092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,2,power_law_1.2,0.41797761917114257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,2,power_law_1.01,1.3984959602355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,2,power_law_1.01,0.6222720146179199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,2,power_law_1.01,18.50563201904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,2,balanced,15.426666259765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,2,power_law_1.2,8.42899169921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,2,balanced,0.6574613253275553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,2,power_law_1.2,0.4355455875396729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,2,power_law_1.01,0.9609151840209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,2,power_law_1.01,2.0074623107910154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,2,power_law_1.2,10.47523193359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,2,balanced,0.6960586706797282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,2,power_law_1.2,0.4984000205993652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,2,balanced,8.306490580240885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,2,power_law_1.01,1.1104448318481446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,2,power_law_1.01,2.70196475982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,2,power_law_1.01,24.179046630859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,2,power_law_1.2,0.5791168212890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,2,power_law_1.2,16.899256896972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,2,power_law_1.01,4.043827056884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,2,power_law_1.2,0.5995007991790772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,2,power_law_1.01,6.413926696777343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,2,power_law_1.2,20.14344940185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,2,power_law_1.2,0.5801536083221436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,2,balanced,24.481430053710938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,2,balanced,1.0432533423105876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,2,power_law_1.01,1.5415743827819823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,2,power_law_1.01,37.47088623046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,2,power_law_1.2,0.7539008140563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,2,balanced,13.904336293538412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,2,power_law_1.01,8.735257720947265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,2,power_law_1.01,2.2189119338989256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,2,balanced,1.3849813143412273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,2,power_law_1.2,0.872652816772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,2,power_law_1.2,31.405972290039063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,2,power_law_1.2,0.9873600006103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,2,power_law_1.01,3.6118335723876953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,2,power_law_1.01,10.180608367919922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,2,balanced,2.0848159790039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,2,power_law_1.2,1.5013440132141114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,2,power_law_1.01,4.813452911376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,2,balanced,2.80297056833903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,2,power_law_1.2,2.0943744659423826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,2,power_law_1.2,38.9770751953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,2,power_law_1.01,14.19562225341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,2,power_law_1.01,6.510150146484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,2,power_law_1.2,2.647660827636719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,2,balanced,4.257317225138347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,2,power_law_1.01,89.84725341796874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,2,power_law_1.01,8.859238433837891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,2,power_law_1.2,4.069472122192383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,2,power_law_1.01,28.623751831054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,2,balanced,5.707701365152995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,2,balanced,48.9831797281901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,2,power_law_1.2,5.724396896362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,2,power_law_1.01,13.271980285644531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,2,balanced,27.62506612141927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,2,power_law_1.2,10.058719635009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,2,power_law_1.01,31.742401123046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,2,power_law_1.2,93.85799560546874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,2,balanced,8.555013020833334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,2,power_law_1.01,18.602969360351562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,2,power_law_1.2,12.356441497802734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,2,power_law_1.01,24.179974365234376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,2,balanced,11.690559387207031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,2,power_law_1.2,15.556031799316406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,2,power_law_1.2,22.730073547363283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,2,power_law_1.01,44.61416931152344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,2,balanced,14.921029408772787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,2,power_law_1.2,44.85296630859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,2,balanced,25.328598022460938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,2,power_law_1.01,89.13689575195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,2,balanced,54.672576904296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,1,balanced,0.10327466328938802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,1,balanced,0.18305067221323648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,1,power_law_1.01,0.11141760349273681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,1,power_law_1.01,0.18229119777679442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,1,balanced,0.17242666085561117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,1,balanced,0.30398400624593097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,1,power_law_1.01,0.14610559940338136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,1,power_law_1.01,0.25770881175994875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,1,balanced,0.3081973393758138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,2,power_law_1.2,0.16301440000534057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,1,balanced,0.5714986721674601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,1,power_law_1.01,0.17341439723968505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,1,power_law_1.01,0.2550528049468994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,1,balanced,0.31301333506902057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,2,power_law_1.2,0.1621567964553833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,1,balanced,0.5748106638590494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,1,power_law_1.01,0.30053119659423827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,1,power_law_1.01,0.5743103981018066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,1,balanced,0.3130026658376058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,2,power_law_1.2,0.22294399738311768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,1,balanced,0.5775200128555298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,1,balanced,0.10827733079592387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,1,power_law_1.01,0.1002303957939148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,1,balanced,0.31489600737889606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,1,power_law_1.01,0.31296639442443847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,1,power_law_1.01,0.5539008140563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,2,power_law_1.2,0.31763200759887694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,1,balanced,0.5793386697769165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,1,balanced,0.1728960076967875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,1,balanced,0.31990400950113934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,1,power_law_1.01,0.1245695948600769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,1,power_law_1.01,0.5820799827575683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,1,power_law_1.01,0.32247679233551024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,2,power_law_1.2,0.3190464019775391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,1,balanced,0.5845546722412109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,1,balanced,0.3081653316815694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,1,balanced,0.3214720090230306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,1,power_law_1.01,0.15794559717178344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,1,power_law_1.01,0.34483840465545657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,1,power_law_1.01,0.5921855926513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,2,power_law_1.2,0.35368320941925047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,1,balanced,0.5861866474151611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,1,balanced,0.31176533301671344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,1,balanced,0.323743999004364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,1,power_law_1.01,0.30600318908691404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,1,power_law_1.01,0.3305344104766846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,1,power_law_1.01,0.603769588470459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,2,power_law_1.2,0.3894207954406738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,1,balanced,0.6055519978205363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,1,balanced,0.3259039918581645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,1,balanced,0.3144693374633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,1,power_law_1.01,0.31410560607910154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,1,power_law_1.01,0.35212159156799316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,1,power_law_1.01,0.6308671951293945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,1,balanced,0.3356800079345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,2,power_law_1.2,0.44944000244140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,1,balanced,0.6079466740290324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,1,balanced,0.3176693320274353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,1,power_law_1.2,0.16581120491027831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,1,power_law_1.01,0.3337984085083008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,1,power_law_1.01,0.3643903970718384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,1,power_law_1.01,0.6556352138519287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,1,balanced,0.3397013346354167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,1,balanced,0.3211039900779724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,1,balanced,0.6199466784795126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,1,power_law_1.01,0.3822783946990967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,1,power_law_1.01,0.3431296110153198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,1,power_law_1.01,0.6808191776275635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,1,power_law_1.2,0.2423487901687622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,1,balanced,0.32334933678309125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,1,balanced,0.3407520055770874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,1,balanced,0.615610678990682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,2,power_law_1.2,0.42304000854492185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,1,power_law_1.01,0.3891200065612793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,1,power_law_1.01,0.40259199142456054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,1,power_law_1.01,0.6888448238372803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,1,power_law_1.2,0.3105600118637085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,1,balanced,0.3664906819661458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,1,balanced,0.6143306493759155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,2,power_law_1.2,0.4033984184265137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,1,power_law_1.01,0.39317760467529295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,1,power_law_1.01,0.7895040035247802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,1,balanced,0.36872533957163495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,1,power_law_1.2,0.5627327919006347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,1,balanced,0.6630080143610636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,1,power_law_1.01,0.3985215902328491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,1,balanced,0.3739519913991292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,1,power_law_1.01,0.7585152149200439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,1,balanced,0.6614506642023722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,1,power_law_1.2,0.576038408279419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,1,power_law_1.01,0.42644481658935546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,1,balanced,0.3995893398920695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,1,balanced,0.32764265934626263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,2,power_law_1.2,0.39450879096984864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,1,power_law_1.01,0.38066558837890624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,1,power_law_1.01,0.8206656455993653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,1,balanced,0.6626826524734497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,1,power_law_1.2,0.5927040100097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,1,power_law_1.01,0.44391679763793945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,1,balanced,0.5216960112253824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,1,balanced,0.33214932680130005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,1,power_law_1.01,0.4104447841644287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,2,power_law_1.2,0.44901118278503416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,1,power_law_1.01,0.8439999580383301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,1,balanced,0.696389357248942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,1,power_law_1.2,0.6062399864196777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,1,power_law_1.01,0.4903679847717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,2,power_law_1.2,0.44965758323669436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,1,balanced,0.5314026673634847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,1,power_law_1.01,0.8759872436523437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,1,balanced,0.8709440231323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,1,power_law_1.01,0.560588788986206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,1,power_law_1.2,0.6077951908111572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,2,power_law_1.2,0.5182528018951416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,1,power_law_1.01,1.0897024154663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,1,balanced,0.7378453413645426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,1,balanced,0.8654560248057047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,1,power_law_1.01,0.655072021484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,1,power_law_1.2,0.6333824157714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,1,power_law_1.01,1.1814528465270997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,1,balanced,0.9170666535695394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,1,power_law_1.01,0.8805760383605957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,1,balanced,1.2286400000254314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,2,power_law_1.2,0.5349311828613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,1,power_law_1.2,0.666764783859253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,1,power_law_1.01,1.6062335968017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,1,power_law_1.01,1.056768035888672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,2,power_law_1.2,0.5528704166412354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,1,balanced,1.5500267346700032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,1,balanced,1.3237173557281494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,1,balanced,0.3436373472213745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,1,power_law_1.2,0.6552383899688721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,1,power_law_1.01,1.8571647644042968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,1,power_law_1.01,0.3707456111907959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,1,power_law_1.01,1.472499179840088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,2,power_law_1.2,0.6908991813659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,1,power_law_1.2,0.6950975894927979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,1,balanced,2.276357332865397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,1,balanced,0.35231999556223553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,1,balanced,1.7401173909505208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,1,power_law_1.01,0.39509758949279783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,1,power_law_1.01,2.6204479217529295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,1,power_law_1.2,0.732755184173584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,1,power_law_1.01,1.8696191787719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,2,power_law_1.2,0.9879360198974609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,1,balanced,0.35835198561350506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,1,power_law_1.2,0.7669568061828613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,1,balanced,3.0393333435058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,1,power_law_1.01,0.4087808132171631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,2,power_law_1.2,1.1527039527893066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,1,power_law_1.01,2.714137649536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,1,power_law_1.01,3.3958145141601563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,1,balanced,2.534992059071859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,1,power_law_1.2,0.7995903968811036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,1,balanced,0.369706670443217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,1,power_law_1.01,0.47374720573425294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,1,power_law_1.2,0.8819904327392578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,1,power_law_1.01,3.5658817291259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,1,power_law_1.01,4.995123291015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,1,balanced,4.470591862996419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,1,balanced,0.4057493209838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,1,power_law_1.2,0.8834752082824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,2,power_law_1.2,1.8471935272216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,1,power_law_1.01,0.4688000202178955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,1,balanced,3.372495969136556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,1,power_law_1.2,1.0478143692016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,1,balanced,0.41735998789469403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,1,power_law_1.01,5.260774230957031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,1,power_law_1.01,6.596076965332031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,1,power_law_1.01,0.4843711853027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,2,power_law_1.2,2.288006401062012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,1,power_law_1.2,1.1910143852233888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,1,balanced,6.1618296305338545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,1,balanced,0.4402079979578654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,1,power_law_1.2,1.5385727882385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,1,power_law_1.01,7.177299499511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,1,power_law_1.01,0.578272008895874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,2,power_law_1.2,3.5497535705566405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,1,power_law_1.01,9.902700805664063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,1,balanced,0.6869760354359945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,1,power_law_1.2,1.9238336563110352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,1,balanced,4.970053354899089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,1,power_law_1.01,0.7624767780303955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,1,power_law_1.2,2.603571128845215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,1,power_law_1.01,8.936294555664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,2,power_law_1.2,4.560537719726563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,1,balanced,0.7416959603627523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,1,balanced,9.07098134358724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,1,power_law_1.2,3.3280704498291014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.01,0.9296832084655762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,1,power_law_1.01,13.100544738769532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,1,balanced,1.1211093266805012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,2,power_law_1.2,7.199110412597657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,1,power_law_1.2,4.850304031372071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.01,1.3003199577331543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,1,balanced,6.931973139444987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,1,power_law_1.01,14.12794189453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,1,balanced,1.4928693771362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,1,power_law_1.2,6.564012908935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.01,1.681817626953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,2,power_law_1.2,9.927385711669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,1,balanced,12.565600077311197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,1,power_law_1.01,16.236172485351563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,1,balanced,2.230485280354818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.01,2.4001535415649413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,1,power_law_1.2,9.938706970214843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,1,power_law_1.01,27.85047607421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,2,power_law_1.2,15.720684814453126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.01,3.1118335723876953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,1,balanced,8.757781346638998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,1,balanced,2.9691734313964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,1,power_law_1.2,13.008274841308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.01,4.581862258911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,1,power_law_1.01,25.494496154785157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,1,balanced,15.809071858723959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,1,balanced,4.4302934010823565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,2,power_law_1.2,18.264569091796876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,1,power_law_1.2,16.29443817138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.01,6.011667251586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,1,balanced,5.932053248087565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.01,9.032300567626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,2,power_law_1.2,26.38560791015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,1,balanced,14.076224009195963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,1,power_law_1.2,25.56513214111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,1,power_law_1.01,50.497528076171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.01,12.116140747070313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,1,balanced,8.931957244873047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,1,balanced,24.645716349283855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,1,power_law_1.01,14.99120635986328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,1,power_law_1.2,50.55757446289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,2,power_law_1.2,45.642214965820315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,1,balanced,12.033397674560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,1,power_law_1.01,25.529997253417967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,1,balanced,27.8101069132487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,1,balanced,15.28121566772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,1,power_law_1.01,53.44138793945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,2,power_law_1.2,97.54098510742188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,1,balanced,49.74101765950521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,1,balanced,25.72687530517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,1,balanced,54.806365966796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,1,power_law_1.2,0.1115455985069275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,1,power_law_1.2,0.1316864013671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,1,power_law_1.2,0.1766975998878479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,1,power_law_1.2,0.30423679351806643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,1,power_law_1.2,0.3131135940551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,1,power_law_1.2,0.32330880165100095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,1,power_law_1.2,0.34498560428619385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,1,power_law_1.2,0.3387264013290405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,1,power_law_1.2,0.35256319046020507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,1,power_law_1.2,0.10671360492706299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,1,power_law_1.2,0.364518404006958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,1,power_law_1.2,0.12319359779357911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,1,power_law_1.2,0.3545471906661987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,1,power_law_1.2,0.2041408061981201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,1,power_law_1.2,0.2989567995071411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,1,power_law_1.2,0.3847615957260132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,1,power_law_1.2,0.3067712068557739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,1,power_law_1.2,0.38061439990997314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,1,power_law_1.2,0.34279680252075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,1,power_law_1.2,0.39797120094299315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,1,power_law_1.2,0.43471999168395997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,1,power_law_1.2,0.38103680610656737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,1,power_law_1.2,0.4426432132720947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,1,power_law_1.2,0.40612478256225587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,1,power_law_1.2,0.4873343944549561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,1,power_law_1.2,0.5895743846893311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,1,power_law_1.2,0.6413375854492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,1,power_law_1.2,0.3847487926483154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,1,power_law_1.2,0.886086368560791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,1,power_law_1.2,0.39296000003814696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,1,power_law_1.2,1.0461055755615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,1,power_law_1.2,1.4935680389404298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,1,power_law_1.2,1.8691135406494142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,1,power_law_1.2,0.3678783893585205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,1,power_law_1.2,2.649740791320801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,1,power_law_1.2,0.4020864009857178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,2,balanced,0.13166399796803793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,1,power_law_1.2,3.5368320465087892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,1,power_law_1.2,0.4067071914672852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,1,power_law_1.2,5.279999923706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,2,balanced,0.19951466719309488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,1,power_law_1.2,0.48360958099365237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,2,balanced,0.3575146595637004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,1,power_law_1.2,0.4840832233428955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,2,balanced,0.0881173312664032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,1,power_law_1.2,7.136370849609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,2,balanced,0.685920000076294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,1,power_law_1.2,0.5026303768157959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,2,balanced,0.12441600362459819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,1,power_law_1.2,0.5796031951904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,1,power_law_1.2,8.834425354003907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,2,balanced,1.3260746796925862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,2,balanced,0.20605866114298502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,1,power_law_1.2,0.7589375972747803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,2,balanced,2.605445384979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,2,balanced,0.3691466649373372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.2,0.9264896392822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,1,power_law_1.2,14.095584106445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,2,balanced,2.615488052368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,2,balanced,0.6982080141703287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.2,1.311571216583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,2,balanced,2.6257707277933755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,2,balanced,1.3539093335469563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.2,1.6431871414184571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,2,balanced,2.629535992940267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,1,power_law_1.2,27.727020263671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,2,balanced,1.3581652641296387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.2,2.379360008239746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,2,balanced,2.639135996500651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,2,balanced,1.3516160647074382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.2,3.1101184844970704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,2,balanced,2.6516267458597818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,2,balanced,1.3508319854736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.2,4.579724884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,2,balanced,2.638831933339437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,2,balanced,1.3664746284484863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,2,balanced,2.659125328063965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.2,6.081958389282226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,2,balanced,1.3699946403503418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,2,balanced,2.661440054575602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,2,balanced,1.3740320205688477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.2,9.025740814208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,2,power_law_1.01,0.13258880376815796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,2,power_law_1.01,0.2227008104324341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,2,balanced,2.6858132680257163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,2,balanced,1.3822186787923176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.2,12.133331298828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,2,power_law_1.01,0.20320000648498535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,2,balanced,2.6869068145751953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,2,power_law_1.01,0.36068480014801024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,2,balanced,1.394938627878825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,2,power_law_1.01,0.19445120096206664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,2,power_law_1.01,0.24917120933532716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,2,balanced,2.7464799880981445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,2,balanced,1.3997759819030762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,1,power_law_1.2,15.36904296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,2,power_law_1.01,0.2705280065536499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,2,power_law_1.01,0.5101568222045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,2,balanced,1.4114185969034831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,2,balanced,2.795978546142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,2,power_law_1.01,0.48009600639343264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,2,power_law_1.01,0.9077568054199219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,2,balanced,0.1086079974969228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,2,balanced,1.4477492968241374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,1,power_law_1.2,25.356480407714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,2,balanced,2.8709065119425454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,2,power_law_1.01,0.16649600267410278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,2,power_law_1.01,0.6537536144256592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,2,balanced,0.1415786643822988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,2,power_law_1.01,1.2577919960021973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,2,balanced,1.4855573972066243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,2,power_law_1.01,0.23836801052093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,2,balanced,0.23523734013239542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,2,power_law_1.01,0.9377984046936035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,2,balanced,2.96180788675944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,2,power_law_1.01,1.7987775802612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,2,balanced,0.4009759823481242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,2,power_law_1.01,0.1863103985786438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,2,balanced,1.5232373873392742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,2,balanced,0.7135679721832275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,2,power_law_1.01,0.9550975799560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,2,power_law_1.01,1.8596223831176757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,2,power_law_1.01,0.3291327953338623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,2,balanced,3.1135946909586587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,2,balanced,1.3564799626668294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,1,power_law_1.2,52.50350341796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,2,power_law_1.01,1.0467776298522948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,2,balanced,1.5965065956115723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,2,power_law_1.01,1.9954111099243164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,2,balanced,1.363957405090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,2,power_law_1.01,0.5000703811645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,2,power_law_1.01,1.0614015579223632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,2,balanced,1.367461363474528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,2,power_law_1.01,2.0298751831054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,2,power_law_1.01,0.7014463901519775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,2,balanced,3.2892373402913413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,2,balanced,1.6996906598409016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,2,balanced,1.373616059621175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,2,power_law_1.01,1.0354304313659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,2,power_law_1.01,0.9468223571777343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,2,power_law_1.01,2.138476753234863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,2,balanced,1.377903938293457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,2,power_law_1.01,0.9668416023254395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,2,power_law_1.01,1.192300796508789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,2,balanced,1.3868160247802734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,2,power_law_1.01,2.1756479263305666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,2,balanced,1.8211199442545574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,2,balanced,3.40283203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,2,power_law_1.01,0.9998720169067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,2,balanced,1.3998719851175945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,2,power_law_1.01,1.2012224197387695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,2,power_law_1.01,2.2105344772338866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,2,balanced,1.4107413291931152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,2,power_law_1.01,1.087334442138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,2,power_law_1.01,1.205235195159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,2,balanced,1.4234719276428223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,2,power_law_1.01,2.248134422302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,2,balanced,1.9586346944173176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,2,power_law_1.01,1.1765760421752929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,2,power_law_1.01,1.2623167991638184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,2,balanced,1.4485653241475422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,2,power_law_1.01,1.1948863983154296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,2,balanced,4.294421195983887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,2,power_law_1.01,2.3505151748657225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,2,power_law_1.01,1.3270719528198243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,2,balanced,1.4667359987894695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,2,power_law_1.01,1.262502384185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,2,power_law_1.01,2.376947212219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,2,power_law_1.01,1.4333312034606933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,2,power_law_1.01,1.405401611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,2,balanced,1.5115359624226887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,2,balanced,2.6670185724894204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,2,power_law_1.01,2.606048011779785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,2,power_law_1.01,1.526848030090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,2,power_law_1.01,1.6567935943603516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,2,power_law_1.01,1.6516992568969726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,2,power_law_1.01,2.891379165649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,2,power_law_1.01,1.6181760787963868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,2,balanced,4.625328063964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,2,power_law_1.01,1.8761280059814454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,2,power_law_1.01,3.0100799560546876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,2,power_law_1.01,1.9034624099731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,2,balanced,2.867157300313314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,2,balanced,1.6176479657491047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,2,power_law_1.01,3.3946304321289062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,2,power_law_1.01,1.8109376907348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,2,power_law_1.01,1.9619712829589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,2,power_law_1.01,2.1238847732543946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,2,power_law_1.01,3.293958282470703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,2,power_law_1.01,2.430751991271973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,2,power_law_1.01,3.7072128295898437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,2,balanced,6.314069112141927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,2,power_law_1.01,3.027737617492676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,2,power_law_1.01,4.236735916137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,2,power_law_1.01,3.751814270019531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,2,balanced,3.9973119099934897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,2,power_law_1.01,5.397721481323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,2,balanced,1.7175466219584148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,2,power_law_1.01,5.069222259521484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.01,1.822265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,2,power_law_1.01,6.4737091064453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,2,balanced,1.892837365468343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,2,power_law_1.01,6.667667388916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,2,power_law_1.01,2.2170944213867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,2,power_law_1.01,8.5604736328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.01,2.7126911163330076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,2,power_law_1.01,7.988716888427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,2,balanced,2.0547520319620767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,2,power_law_1.01,3.0057279586791994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,2,power_law_1.01,10.883103942871093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,2,balanced,8.321114857991537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.01,3.9260478973388673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,2,power_law_1.01,11.664466857910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,2,balanced,2.545642693837484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,2,power_law_1.01,13.288896179199218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,2,power_law_1.01,4.978630447387696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,2,balanced,5.263039906819661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.01,6.302233505249023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,2,balanced,2.7973759969075522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,2,power_law_1.01,23.202496337890626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,2,power_law_1.01,19.540864562988283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,2,power_law_1.01,9.202003479003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.01,12.490425872802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,2,balanced,4.47161070505778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,2,power_law_1.01,37.69350891113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,2,power_law_1.01,15.250822448730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,2,balanced,10.374165217081705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,2,balanced,6.5408477783203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,2,power_law_1.01,23.945849609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,2,balanced,5.19378662109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,2,power_law_1.01,49.19361267089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,2,balanced,7.706122716267903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,2,balanced,16.512704213460285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,2,balanced,10.17142422993978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,2,balanced,10.589301427205404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,2,power_law_1.2,0.2207808017730713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,2,balanced,13.168394724527994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,2,power_law_1.2,0.35354878902435305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,2,power_law_1.2,0.25764479637146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,2,power_law_1.2,0.52609281539917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,2,power_law_1.2,0.7307007789611817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,2,power_law_1.2,1.1621376037597657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,2,power_law_1.2,1.789779281616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,2,power_law_1.2,1.8959871292114259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,2,power_law_1.2,1.988083267211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,2,power_law_1.2,2.0215103149414064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,2,power_law_1.2,2.0872896194458006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,2,power_law_1.2,2.2687103271484377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,2,power_law_1.2,0.1323904037475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,2,power_law_1.2,2.2228416442871093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,2,balanced,21.84051767985026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,2,power_law_1.2,0.203385591506958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,2,power_law_1.2,2.376006317138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,2,power_law_1.2,0.15262080430984498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,2,power_law_1.2,2.397881507873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,2,balanced,19.970650990804035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,2,power_law_1.2,0.28641281127929685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,2,power_law_1.2,2.572697639465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,2,balanced,32.064361572265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,2,power_law_1.2,0.42325119972229003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,2,power_law_1.2,2.5897279739379884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,2,power_law_1.2,0.5854527950286865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,2,power_law_1.2,3.092710494995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,2,power_law_1.2,0.9312383651733398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,2,power_law_1.2,3.346553421020508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,2,power_law_1.2,0.9550975799560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,2,power_law_1.2,3.813702392578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,2,power_law_1.2,1.010540771484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,2,power_law_1.2,3.439731216430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,2,power_law_1.2,1.0395008087158204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,2,power_law_1.2,4.134451293945313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,2,power_law_1.2,1.1033344268798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,2,power_law_1.2,4.685843276977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,2,power_law_1.2,1.119974422454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,2,power_law_1.2,1.2491007804870606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,2,power_law_1.2,5.623904037475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,2,power_law_1.2,1.258944034576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,2,power_law_1.2,1.2844415664672852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,2,power_law_1.2,6.9077507019042965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,2,power_law_1.2,1.371180820465088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,2,power_law_1.2,1.5097920417785644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,2,power_law_1.2,9.963072204589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,2,power_law_1.2,1.76812801361084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,2,power_law_1.2,12.226771545410156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,2,power_law_1.2,1.7853376388549804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,2,power_law_1.2,2.0596288681030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,2,power_law_1.2,1.9269567489624024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,2,power_law_1.2,14.407072448730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,2,power_law_1.2,2.258540725708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,2,balanced,44.5330556233724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,2,power_law_1.2,2.5089216232299805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,2,power_law_1.2,20.937266540527343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,2,power_law_1.2,3.511404800415039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,2,power_law_1.2,4.075283050537109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,2,power_law_1.2,38.414309692382815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,2,power_law_1.2,5.504371261596679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,2,power_law_1.2,0.15714559555053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,2,power_law_1.2,6.984025573730468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,2,power_law_1.2,0.23662080764770507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,2,power_law_1.2,8.184544372558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,2,power_law_1.2,0.1683135986328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,1,balanced,0.13528000315030417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,2,power_law_1.2,0.2936320066452026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,2,power_law_1.2,12.380095672607421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,1,balanced,0.20279467105865479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,2,power_law_1.2,0.4306496143341064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,1,balanced,0.3636480172475179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,2,power_law_1.2,0.5721663951873779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,1,balanced,0.6945652961730957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,2,power_law_1.2,22.814105224609374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,2,power_law_1.2,0.919865608215332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,1,balanced,1.3513493537902832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,2,power_law_1.2,1.0150464057922364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,1,balanced,2.6138025919596353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,2,power_law_1.2,1.069593620300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,1,balanced,2.6286346117655435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,1,balanced,0.08974400162696838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,2,power_law_1.2,1.0445823669433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,1,balanced,2.6246827443440757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,1,balanced,0.1254026691118876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,2,power_law_1.2,1.126137638092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,1,balanced,2.62829860051473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,1,balanced,0.20660799741744995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,2,power_law_1.2,1.266988754272461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,1,balanced,2.642517407735189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,1,balanced,0.374783992767334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,2,power_law_1.2,1.3356160163879394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,1,balanced,2.647541364034017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,1,balanced,0.7092479864756266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,2,power_law_1.2,1.423040008544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,1,balanced,2.664127985636393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,1,balanced,1.3605653444925945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,2,power_law_1.2,1.563366413116455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,1,balanced,1.3604319890340169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,1,balanced,2.6849120457967124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,1,balanced,1.3594506581624348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,2,power_law_1.2,1.6718015670776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,1,balanced,2.693999926249186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,1,balanced,1.3695039749145508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,1,balanced,2.7135146458943686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,2,power_law_1.2,1.9746688842773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,1,balanced,1.3708213170369465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,1,balanced,2.7271254857381186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,1,balanced,1.387114683787028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,1,balanced,2.757434527079264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,2,power_law_1.2,2.0610240936279296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,1,balanced,1.4141759872436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,1,balanced,2.909520149230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,1,balanced,1.4372266133626301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,1,balanced,1.4477440516153972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,1,balanced,2.959530512491862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.2,1.987411117553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,1,balanced,1.4566720326741536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,2,power_law_1.2,2.3591808319091796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,1,balanced,3.0357494354248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,1,balanced,1.4673706690470378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.2,2.7147199630737306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,1,balanced,1.499381383260091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,1,balanced,3.250783920288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,2,power_law_1.2,3.1801664352416994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,1,balanced,1.5411307017008464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.2,3.76890869140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,1,balanced,3.510239919026693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,1,balanced,1.6360373497009277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,2,power_law_1.2,5.662271881103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,1,balanced,1.7368052800496419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,1,balanced,3.743743896484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.2,6.511315155029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,1,balanced,1.8558346430460613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,2,power_law_1.2,9.298035430908204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,1,balanced,2.082640012105306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,1,balanced,4.828367869059245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.2,12.046144104003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,1,balanced,2.320682684580485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,2,power_law_1.2,15.012428283691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,1,balanced,5.334933598836263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,1,balanced,3.1302293141682944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,2,power_law_1.2,25.4450439453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,1,balanced,3.5798772176106772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,1,balanced,7.370645523071289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,1,power_law_1.01,0.13390719890594482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,2,power_law_1.2,51.85732421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,1,power_law_1.01,0.20017919540405274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,1,power_law_1.01,0.26204159259796145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,1,power_law_1.01,0.5110784053802491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,1,balanced,5.033029238382976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,1,power_law_1.01,0.858732795715332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,1,power_law_1.01,1.1621503829956055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,1,balanced,0.14314666390419006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,1,balanced,9.926106770833334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,1,power_law_1.01,1.7534143447875976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,1,balanced,0.17845332622528076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,1,power_law_1.01,1.892582321166992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,1,balanced,0.2601120074590047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,1,balanced,0.42220266660054523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,1,power_law_1.01,1.9647424697875977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,1,balanced,0.729973316192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,1,power_law_1.01,1.9963903427124023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,1,balanced,1.3840959866841633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,1,balanced,6.651482899983724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,1,power_law_1.01,2.0895423889160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,1,balanced,1.39246400197347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,1,balanced,1.4003626505533855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,1,power_law_1.01,2.164089584350586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,1,balanced,1.4116479555765789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,1,power_law_1.01,2.1949567794799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,1,balanced,1.4120052655537922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,1,balanced,11.749071756998697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,1,balanced,1.435215950012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,1,power_law_1.01,2.282054328918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,1,balanced,1.453887939453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,1,power_law_1.01,2.356096076965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,1,balanced,1.4693652788798015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,1,power_law_1.01,2.427168083190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,1,balanced,1.5047039985656738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,1,power_law_1.01,2.601408004760742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,1,balanced,1.550821304321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,1,balanced,8.127066930135092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,1,power_law_1.01,0.08452479839324951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,1,balanced,1.5899732907613118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,1,power_law_1.01,2.805574417114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,1,power_law_1.01,3.149932861328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,1,power_law_1.01,0.12391680479049683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,1,balanced,1.660362720489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,1,power_law_1.01,0.14395519495010375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,1,power_law_1.01,3.7302207946777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,1,power_law_1.01,0.2830336093902588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,1,power_law_1.01,3.242015838623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,1,power_law_1.01,0.4654911994934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,1,power_law_1.01,3.7143550872802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,1,balanced,1.832309405008952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,1,power_law_1.01,0.623583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,1,power_law_1.01,4.32097282409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,1,power_law_1.01,0.9293824195861816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,1,power_law_1.01,0.9941311836242676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,1,balanced,20.082005818684895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,1,power_law_1.01,5.4647167205810545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,1,power_law_1.01,1.0356863975524901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,1,power_law_1.01,6.552921295166016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,1,power_law_1.01,0.1401792049407959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,1,power_law_1.01,1.0762368202209474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,1,power_law_1.01,1.0835776329040527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,1,power_law_1.01,0.18487679958343506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,1,power_law_1.01,8.900383758544923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,1,power_law_1.01,1.1394880294799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,1,power_law_1.01,0.19185919761657716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,1,balanced,13.445327758789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,1,balanced,2.0287307103474936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,1,power_law_1.2,0.13349759578704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,1,power_law_1.01,11.50113296508789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,1,power_law_1.01,1.1773568153381349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,1,power_law_1.01,0.32817280292510986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,1,power_law_1.2,0.20094718933105468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,1,power_law_1.01,1.2662079811096192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,1,power_law_1.01,0.5128704071044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,1,balanced,2.3378453254699707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,1,power_law_1.2,0.25719680786132815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,1,power_law_1.01,14.026284790039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,1,power_law_1.01,1.3188480377197265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,1,power_law_1.01,0.6759488105773925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,1,power_law_1.2,0.491923189163208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,1,balanced,2.555178642272949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,1,power_law_1.2,0.755673599243164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,1,power_law_1.01,1.3470848083496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,1,power_law_1.01,0.978495979309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,1,power_law_1.2,1.013657569885254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,1,power_law_1.01,20.898912048339845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,1,power_law_1.01,1.451871967315674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,1,power_law_1.01,1.0347328186035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,1,power_law_1.2,1.6936447143554687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,1,balanced,3.368768056233724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,1,power_law_1.01,1.659846305847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,1,power_law_1.2,1.862553596496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,1,power_law_1.01,1.0585920333862304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,1,power_law_1.2,1.9217536926269532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,1,power_law_1.01,1.6593856811523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,1,power_law_1.01,1.1091903686523437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,1,power_law_1.2,1.9935615539550782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,1,power_law_1.01,1.9579839706420898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,1,power_law_1.01,1.1941503524780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,1,power_law_1.01,38.232415771484376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,1,balanced,3.879157384236654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,1,power_law_1.2,2.1406784057617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,1,power_law_1.01,1.9069311141967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,1,power_law_1.2,2.1956480026245115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,1,power_law_1.01,1.295564842224121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,1,power_law_1.2,2.299750328063965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,1,power_law_1.01,2.2631359100341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,1,power_law_1.01,1.3417216300964356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,1,power_law_1.2,2.4031679153442385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,1,power_law_1.01,2.6278911590576173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,1,power_law_1.2,2.408844757080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,1,balanced,6.276959737141927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,1,power_law_1.01,1.4499648094177247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,1,power_law_1.2,2.557504081726074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,1,power_law_1.01,3.3985729217529297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,1,power_law_1.01,1.5656895637512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,1,power_law_1.2,2.7434240341186524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,1,power_law_1.01,1.7030656814575196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,1,power_law_1.01,4.186272048950196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,1,power_law_1.2,3.0121984481811523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,1,power_law_1.2,3.377555084228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,1,power_law_1.01,1.9386112213134765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,1,power_law_1.01,5.7892414093017575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,1,balanced,7.387909571329753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,1,power_law_1.2,3.9737598419189455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,1,power_law_1.01,7.403929901123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,1,power_law_1.2,3.4854721069335937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,1,power_law_1.01,2.1642431259155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,1,power_law_1.2,4.05285758972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,1,power_law_1.01,8.959065246582032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,1,power_law_1.2,4.58166389465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,1,balanced,36.64843241373698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,1,power_law_1.2,5.761376190185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.01,2.1107967376708983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,1,power_law_1.01,14.494355773925781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,1,power_law_1.2,6.891276550292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.01,2.6175615310668947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,1,balanced,10.912773132324219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,1,power_law_1.2,9.28155517578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,1,balanced,27.07415008544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.01,3.091251182556152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,1,power_law_1.01,27.599246215820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,1,power_law_1.2,12.037728118896485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.01,3.852115249633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,1,power_law_1.2,14.4521728515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.01,4.687910461425782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.01,6.396511840820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,1,power_law_1.2,21.22563781738281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.01,8.141490936279297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,1,balanced,14.832735697428385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.01,11.73797149658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,1,power_law_1.2,38.82719421386719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.01,15.187295532226562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,1,power_law_1.01,18.758834838867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,1,power_law_1.01,29.73603210449219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,1,balanced,18.353978474934895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,1,power_law_1.2,0.08488320112228394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,1,power_law_1.2,0.12355200052261353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,1,power_law_1.2,0.13997440338134765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,1,power_law_1.01,58.85699462890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,1,power_law_1.2,0.2640511989593506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,1,power_law_1.2,0.3905280113220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,1,power_law_1.2,0.5444032192230225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,1,power_law_1.2,0.9137727737426757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,1,power_law_1.2,0.950278377532959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,1,power_law_1.2,1.0215871810913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,1,power_law_1.2,1.062611198425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,1,power_law_1.2,1.0925951957702638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,1,balanced,30.652239481608074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,1,power_law_1.2,1.1497471809387207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,1,power_law_1.2,1.1778047561645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,1,power_law_1.2,1.256447982788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,1,power_law_1.2,1.3519935607910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,1,power_law_1.2,1.41911039352417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,1,power_law_1.2,1.5400896072387695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,1,power_law_1.2,1.6935487747192384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,1,power_law_1.2,1.771334457397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,1,power_law_1.2,2.1170175552368162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,1,power_law_1.2,2.0062976837158204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,1,power_law_1.2,2.393951988220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,1,power_law_1.2,2.7706111907958983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,1,power_law_1.2,3.5507839202880858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,1,power_law_1.2,4.330899047851562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,1,power_law_1.2,5.928883361816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,1,power_law_1.2,7.488972473144531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,1,power_law_1.2,9.11810531616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,1,power_law_1.2,14.898944091796874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,1,power_law_1.2,27.67799072265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,1,balanced,61.50274658203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,1,power_law_1.2,0.14479360580444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,1,power_law_1.2,0.1848512053489685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,1,power_law_1.2,0.19742720127105712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,2,balanced,0.033071999748547874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,1,power_law_1.2,0.29816958904266355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,2,balanced,0.042725334564844765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,2,balanced,0.06102933486302694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,1,power_law_1.2,0.4278656005859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,2,balanced,0.09834667046864827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,1,power_law_1.2,0.601964807510376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,2,balanced,0.1651573379834493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,1,power_law_1.2,0.9530367851257324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,2,balanced,0.1673333247502645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,1,power_law_1.2,1.0200639724731446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,2,balanced,0.16793066263198853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,2,balanced,0.16820265849431357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,1,power_law_1.2,1.0628735542297363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,2,balanced,0.16916267077128092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,1,power_law_1.2,1.0707967758178711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,2,balanced,0.17078399658203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,2,balanced,0.035018667578697205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,1,power_law_1.2,1.1987071990966798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,2,balanced,0.17153600851694742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,2,balanced,0.03557866563399633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,2,balanced,0.17457600434621176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,1,power_law_1.2,1.27893123626709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,2,balanced,0.04972266654173533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,2,balanced,0.176581343015035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,1,power_law_1.2,1.3513471603393554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,2,balanced,0.07042133311430614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,2,balanced,0.1790293256441752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,1,power_law_1.2,1.4542847633361817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,2,balanced,0.10733333230018616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,2,balanced,0.1889280080795288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,2,balanced,0.10860266288121541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,1,power_law_1.2,1.6318208694458007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,2,balanced,0.19132266441980997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,2,balanced,0.10833066701889038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,1,power_law_1.2,1.7903295516967774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,2,balanced,0.19913599888483682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,2,balanced,0.10868799686431885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,2,power_law_1.01,0.040838399529457094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,2,balanced,0.0422026664018631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,1,power_law_1.2,2.003398323059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,2,balanced,0.21636799971262613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,2,balanced,0.10981333255767822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,2,power_law_1.01,0.03947519958019256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,2,balanced,0.04472533365090688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,2,balanced,0.23057599862416586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,2,balanced,0.1123306651910146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,2,balanced,0.05221333106358846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,2,power_law_1.01,0.05249279737472534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,2,balanced,0.07166400055090587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,1,power_law_1.2,2.1907327651977537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,2,balanced,0.11309333642323811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,2,power_law_1.01,0.07585920095443725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,2,balanced,0.2525599996248881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,2,balanced,0.10808533430099487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,2,balanced,0.11657599608103435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,2,power_law_1.01,0.09688959717750549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,2,balanced,0.10944533348083496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,2,balanced,0.27027199665705365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,2,balanced,0.11769066254297893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,2,power_law_1.01,0.1462656021118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.2,2.1994943618774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,2,balanced,0.11030933260917664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,2,balanced,0.12026133139928182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,2,power_law_1.01,0.15110399723052978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,2,balanced,0.11239999532699585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,2,balanced,0.35811201731363934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.2,2.7119167327880858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,2,balanced,0.1264693339665731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,2,power_law_1.01,0.15360000133514404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,2,balanced,0.1130506694316864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.2,3.1931455612182615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,2,balanced,0.11552533507347107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,2,power_law_1.01,0.15722880363464356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,2,balanced,0.12868799765904745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,2,balanced,0.3928106625874837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,2,balanced,0.11698133746782939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.2,3.8928958892822267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,2,power_law_1.01,0.16370559930801393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,2,balanced,0.13980266451835632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,2,power_law_1.01,0.0369024008512497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,2,balanced,0.12079466382662456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,2,power_law_1.01,0.16874879598617554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.2,4.750175857543946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,2,balanced,0.15437333782513937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,2,balanced,0.12446399529774983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,2,power_law_1.01,0.036313599348068236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,2,power_law_1.01,0.1770560026168823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,2,balanced,0.5424906810124716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,2,power_law_1.01,0.04565120041370392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,2,balanced,0.12889599800109863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.2,6.4737091064453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,2,balanced,0.17194666465123495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,2,power_law_1.01,0.17955199480056763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,2,power_law_1.01,0.060601598024368285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,2,power_law_1.01,0.06783360242843628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,2,power_law_1.01,0.18198399543762206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,2,balanced,0.19620267550150552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.2,8.176076507568359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,2,power_law_1.01,0.09300479888916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,2,power_law_1.01,0.19998719692230224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,2,power_law_1.01,0.09685119986534119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,2,power_law_1.01,0.10391680002212525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,2,balanced,0.6949280103047689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.2,11.736876678466796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,2,balanced,0.22225600481033325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,2,power_law_1.01,0.20559999942779542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,2,balanced,0.14059199889500937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,2,power_law_1.01,0.10723199844360351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,2,power_law_1.01,0.21931519508361816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,2,power_law_1.01,0.10948480367660522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,2,balanced,0.14337066809336343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,2,power_law_1.01,0.11161600351333618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.2,15.360255432128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,2,balanced,0.30958932638168335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,2,power_law_1.01,0.25294721126556396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,2,power_law_1.01,0.11696000099182129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,2,power_law_1.01,0.25167360305786135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,2,power_law_1.01,0.12120959758758545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,2,power_law_1.01,0.1256384015083313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,1,power_law_1.2,18.768595886230468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,2,power_law_1.01,0.297542405128479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,2,balanced,0.3596426645914714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,2,power_law_1.01,0.1326143980026245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,2,balanced,1.017242670059204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,2,power_law_1.01,0.33368959426879885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,2,power_law_1.01,0.14045439958572387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,2,power_law_1.01,0.14618879556655884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,2,power_law_1.01,0.416864013671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,2,balanced,0.16376533110936484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,2,power_law_1.01,0.17503360509872437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,1,power_law_1.2,29.62913818359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,2,power_law_1.01,0.5034431934356689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,2,power_law_1.01,0.19765119552612304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,2,balanced,0.515999992688497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,2,balanced,0.1896373430887858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,2,power_law_1.01,0.6874239921569825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,2,power_law_1.01,0.23383040428161622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,2,power_law_1.01,0.2775935888290405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,2,balanced,0.20284799734751383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,2,power_law_1.01,0.845580768585205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,2,power_law_1.01,0.3409343957901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,2,power_law_1.01,1.141983985900879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,2,power_law_1.01,0.44106879234313967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,2,balanced,0.2739466627438863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,2,power_law_1.01,0.6058623790740967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,2,power_law_1.01,1.4920063972473145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,2,balanced,0.6722186406453451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,2,balanced,1.332645336786906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,1,power_law_1.2,58.46151123046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,2,power_law_1.01,0.7579264163970947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,2,balanced,0.32265599568684894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,2,power_law_1.01,1.8921791076660157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,2,power_law_1.01,1.0538816452026367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,2,power_law_1.01,1.4154239654541017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,2,power_law_1.01,2.9235071182250976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,2,balanced,0.4943786859512329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,2,power_law_1.01,1.7283712387084962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,2,power_law_1.01,2.764723205566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,2,power_law_1.01,6.0561279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,2,balanced,0.5924266576766968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,2,balanced,0.9811946551005045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,2,power_law_1.01,5.537503814697265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,2,balanced,1.6512746810913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,2,balanced,0.8624746799468994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,2,balanced,1.1300266583760579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,2,balanced,1.3019039630889893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,2,balanced,1.6459520657857258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,2,balanced,2.580495993296305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,2,balanced,1.6099200248718262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,2,power_law_1.01,0.040428799390792844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,2,balanced,2.1862133344014487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,2,power_law_1.01,0.04672000110149384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,2,power_law_1.01,0.05056639909744263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,2,power_law_1.01,0.06305279731750488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,2,power_law_1.2,0.041075199842453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,2,power_law_1.01,0.07412480115890503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,2,power_law_1.2,0.037894400954246524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,2,power_law_1.01,0.09874560236930847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,2,power_law_1.2,0.04741120040416717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,2,power_law_1.01,0.10495359897613525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,2,power_law_1.2,0.06812800168991089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,2,power_law_1.01,0.10696959495544434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,2,power_law_1.2,0.08937600255012512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,2,power_law_1.01,0.11166080236434936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,2,power_law_1.01,0.11678080558776856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,2,balanced,2.7030932108561196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,2,power_law_1.2,0.14245760440826416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,2,power_law_1.01,0.1270591974258423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,2,balanced,2.525925318400065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,2,power_law_1.2,0.14866559505462645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,2,power_law_1.01,0.12981120347976685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,2,power_law_1.2,0.15943679809570313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,2,power_law_1.01,0.13664640188217164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,2,power_law_1.2,0.16600960493087769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,2,power_law_1.01,0.14926079511642457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,2,power_law_1.2,0.16440320014953613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,2,power_law_1.2,0.17147519588470458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,2,power_law_1.2,0.1803712010383606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,2,power_law_1.01,0.16061439514160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,2,power_law_1.2,0.1816704034805298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,2,power_law_1.01,0.16927360296249389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,2,power_law_1.2,0.1970944046974182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,2,power_law_1.2,0.20619521141052247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,2,power_law_1.2,0.21121280193328856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,2,power_law_1.01,0.17482240200042726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,2,power_law_1.2,0.21760640144348145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,2,power_law_1.01,0.20913920402526856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,2,balanced,5.077306747436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,2,power_law_1.2,0.26377599239349364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,2,balanced,4.299093246459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,2,power_law_1.01,0.24237439632415772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,2,power_law_1.2,0.26256000995635986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,2,power_law_1.01,0.32004480361938475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,2,power_law_1.2,0.3000704050064087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,2,power_law_1.01,0.40309758186340333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,2,power_law_1.2,0.35148160457611083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,2,power_law_1.01,0.5412543773651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,2,power_law_1.2,0.4461696147918701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,2,power_law_1.2,0.5488831996917725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,2,power_law_1.01,0.7016831874847412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,2,power_law_1.2,0.6661375999450684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,2,power_law_1.01,1.0086655616760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,2,power_law_1.2,0.8818623542785644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,2,power_law_1.01,1.2921728134155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,2,power_law_1.2,1.322374439239502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,2,power_law_1.01,1.9584575653076173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,2,power_law_1.2,1.5650303840637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,2,power_law_1.01,2.4675968170166014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,2,power_law_1.2,2.015891265869141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,2,power_law_1.01,2.911270332336426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,2,balanced,4.89138666788737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,2,power_law_1.2,3.3542720794677736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,2,power_law_1.01,5.030118560791015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,2,power_law_1.2,6.799430084228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,2,power_law_1.01,9.52451171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,2,balanced,8.538474400838217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,2,power_law_1.2,0.03711360096931458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,1,balanced,0.03288000077009201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,2,power_law_1.2,0.03535360097885132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,1,balanced,0.04402133325735728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,2,power_law_1.2,0.043628799915313723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,1,balanced,0.06261333326498668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,2,power_law_1.2,0.05380480289459229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,1,balanced,0.10098133484522502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,2,power_law_1.2,0.04012799859046936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,1,balanced,0.1678933302561442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,2,power_law_1.2,0.06632959842681885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,1,balanced,0.17140799760818481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,2,power_law_1.2,0.04467200040817261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,1,balanced,0.1725920041402181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,2,power_law_1.2,0.09304320216178893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,2,power_law_1.2,0.04867840111255646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,1,balanced,0.17152533928553262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,1,balanced,0.17270400126775107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,2,power_law_1.2,0.09848319888114929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,2,power_law_1.2,0.05748479962348938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,1,balanced,0.1732213298479716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,2,power_law_1.2,0.10398080348968505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,2,power_law_1.2,0.06722559928894042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,1,balanced,0.17498133579889932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,1,balanced,0.178330659866333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,2,power_law_1.2,0.09930880069732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,2,power_law_1.2,0.11065599918365479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,1,balanced,0.1801813244819641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,2,power_law_1.2,0.11070719957351685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,2,power_law_1.2,0.1041152000427246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,1,balanced,0.1829813321431478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,2,power_law_1.2,0.11237119436264038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,2,power_law_1.2,0.1065600037574768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,1,balanced,0.1960053245226542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,2,power_law_1.2,0.12147200107574463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,1,balanced,0.20334933201471964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,2,power_law_1.2,0.11588480472564697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,1,balanced,0.21533334255218506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,2,power_law_1.2,0.12104959487915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,1,balanced,0.23654399315516153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,2,power_law_1.2,0.11947519779205322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,2,power_law_1.2,0.12495360374450684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,1,balanced,0.2592746615409851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,2,power_law_1.2,0.13779200315475465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,2,power_law_1.2,0.12697600126266478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,2,power_law_1.2,0.14487680196762084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,2,power_law_1.2,0.13244160413742065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,1,balanced,0.29227733612060547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,2,power_law_1.2,0.13987840414047242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,2,power_law_1.2,0.15786240100860596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,1,balanced,0.323253333568573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,2,power_law_1.2,0.14773759841918946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,2,power_law_1.2,0.18258559703826904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,2,power_law_1.2,0.19630719423294068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,1,balanced,0.45152533054351807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,2,power_law_1.2,0.2471872091293335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,2,power_law_1.2,0.16321280002593994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,2,power_law_1.2,0.28457601070404054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,1,balanced,0.5122613509496053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,2,power_law_1.2,0.16842880249023437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,2,power_law_1.2,0.3758080005645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,2,power_law_1.2,0.4689216136932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,2,power_law_1.2,0.1759104013442993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,1,balanced,0.7256213029225668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,2,power_law_1.2,0.6249536037445068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,2,power_law_1.2,0.2134335994720459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,2,power_law_1.2,0.7865344047546386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,2,power_law_1.2,0.24853758811950682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,2,power_law_1.2,1.1512831687927245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,2,power_law_1.2,0.33438720703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,1,balanced,0.9461013476053873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,2,power_law_1.2,1.6075263977050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,2,power_law_1.2,0.4104447841644287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,2,power_law_1.2,2.0022655487060548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,2,power_law_1.2,0.5962495803833008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,2,power_law_1.2,3.132646369934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,2,power_law_1.2,0.7855552196502685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,2,power_law_1.2,1.091596794128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,2,power_law_1.2,6.401216125488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,2,power_law_1.2,1.370969581604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,1,balanced,1.4117172559102376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,2,power_law_1.2,1.9970880508422852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,2,power_law_1.2,2.6950399398803713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,2,power_law_1.2,3.4800254821777346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,1,balanced,0.037290667494138084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,2,power_law_1.2,5.450553512573242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,1,balanced,1.8652853965759277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,1,balanced,0.03736000011364619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,1,balanced,0.05136533578236898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,2,power_law_1.2,12.292320251464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,1,balanced,0.07495999832948048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,1,balanced,0.11499733726183574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,1,balanced,0.11635200182596843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,1,balanced,0.11803733309110005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,1,balanced,0.11899200081825256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,1,balanced,0.12012799580891927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,1,balanced,0.1209386686484019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,1,balanced,2.3262507120768228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,1,balanced,0.12406399846076965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,1,balanced,0.12822399536768594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,1,balanced,0.130703995625178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,1,balanced,0.13715733091036478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,1,balanced,0.14402666687965393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,1,balanced,0.1492853363355001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,1,balanced,0.16715200742085776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,1,balanced,0.19144533077875772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,1,power_law_1.01,0.030675199627876282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,1,balanced,0.21304533878962198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,1,power_law_1.01,0.03782399892807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,1,power_law_1.01,0.0516543984413147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,1,balanced,0.25443732738494873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,1,power_law_1.01,0.07382400035858154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,1,balanced,0.06351999938488007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,1,balanced,0.29253333806991577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,1,power_law_1.01,0.035571199655532834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,1,balanced,3.6548051834106445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,1,power_law_1.01,0.09772160053253173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,1,balanced,0.06489066779613495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,1,power_law_1.01,0.0361407995223999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,1,power_law_1.01,0.14609919786453246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,1,balanced,0.0719946672519048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,1,balanced,0.4249333143234253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,1,power_law_1.01,0.04665600061416626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,1,balanced,0.09018133083979289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,1,power_law_1.01,0.14870400428771974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,1,power_law_1.01,0.061504000425338747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,1,balanced,0.13038399815559387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,1,power_law_1.01,0.1565119981765747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,1,balanced,0.5073013305664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,1,balanced,0.13482667009035745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,1,power_law_1.01,0.07084800004959106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,1,power_law_1.01,0.16174720525741576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,1,balanced,0.1360053320725759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,1,power_law_1.01,0.09904000163078308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,1,power_law_1.01,0.16962560415267944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,1,balanced,0.1394719978173574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,1,power_law_1.01,0.10387840270996093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,1,balanced,0.7267786661783854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,1,power_law_1.01,0.17557120323181152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,1,balanced,0.14309333761533102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,1,power_law_1.01,0.10743680000305175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,1,power_law_1.01,0.1835263967514038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,1,balanced,0.14396799604098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,1,power_law_1.01,0.11564160585403442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,1,power_law_1.01,0.19153280258178712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,1,balanced,0.14751467108726501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,1,power_law_1.01,0.11666560173034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,1,balanced,0.15457066893577576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,1,power_law_1.01,0.053427201509475705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,1,power_law_1.01,0.20710399150848388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,1,power_law_1.01,0.12318079471588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,1,balanced,0.9676746527353922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,1,power_law_1.01,0.13155200481414794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,1,balanced,0.15867732961972555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,1,power_law_1.01,0.22064640522003173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,1,power_law_1.01,0.06388480067253113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,1,balanced,0.164901336034139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,1,power_law_1.01,0.2285759925842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,1,power_law_1.01,0.13720959424972534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,1,power_law_1.01,0.06910719871520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,1,power_law_1.01,0.1392575979232788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,1,power_law_1.01,0.22858240604400634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,1,power_law_1.01,0.0785535991191864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,1,power_law_1.01,0.1505728006362915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,1,power_law_1.01,0.08886399865150452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,1,power_law_1.01,0.26353280544281005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,1,power_law_1.01,0.11783679723739623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,1,balanced,1.4679466883341472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,1,power_law_1.01,0.15886720418930053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,1,power_law_1.01,0.28407039642333987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,1,balanced,0.18476267655690512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,1,power_law_1.01,0.12465920448303222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,1,power_law_1.01,0.17627520561218263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,1,power_law_1.01,0.33063039779663084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,1,balanced,0.19031467040379843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,1,power_law_1.01,0.1282495975494385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,1,power_law_1.01,0.2094208002090454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,1,power_law_1.01,0.36739840507507326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,1,power_law_1.01,0.13466880321502686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,1,power_law_1.01,0.23320319652557372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,1,power_law_1.01,0.4793727874755859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,1,power_law_1.01,0.14109439849853517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,1,power_law_1.01,0.28336000442504883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,1,power_law_1.01,0.5665791988372803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,1,power_law_1.01,0.15166079998016357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,1,power_law_1.01,0.3308480024337769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,1,power_law_1.01,0.7721343994140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,1,power_law_1.01,0.16290559768676757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,1,power_law_1.01,0.4456575870513916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,1,balanced,1.9496533075968425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,1,power_law_1.01,0.9816320419311524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,1,balanced,0.22317334016164145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,1,power_law_1.01,0.1690111994743347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,1,balanced,7.116693496704102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,1,power_law_1.01,0.5476928234100342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,1,power_law_1.01,1.4038528442382812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,1,power_law_1.01,0.18570879697799683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,1,balanced,0.2677653431892395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,1,power_law_1.01,0.770854377746582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,1,power_law_1.01,1.8467391967773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,1,balanced,0.30034132798512775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,1,power_law_1.01,0.9950592041015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,1,power_law_1.01,2.2619775772094726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,1,power_law_1.01,0.19854079484939574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,1,power_law_1.01,1.4481472015380858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,1,balanced,0.4302186568578084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,1,power_law_1.01,0.21511681079864503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,1,power_law_1.01,3.529990386962891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,1,power_law_1.01,1.911289596557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,1,balanced,0.5000906785329183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,1,power_law_1.01,2.3641279220581053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,1,power_law_1.01,7.362188720703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,1,power_law_1.01,0.22749440670013427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,1,balanced,2.4249653816223145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,1,power_law_1.01,3.7510913848876952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,1,balanced,0.763429323832194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,1,power_law_1.01,0.2815040111541748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,1,power_law_1.01,0.34119040966033937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,1,power_law_1.01,7.771199798583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,1,power_law_1.01,0.45724802017211913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,1,balanced,0.9256266752878824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,1,power_law_1.01,0.5581823825836182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,1,power_law_1.01,0.7698239803314209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,1,power_law_1.01,0.9836607933044433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,1,balanced,1.3385599454243977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,1,power_law_1.01,1.4018688201904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,1,power_law_1.01,1.822540855407715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,1,power_law_1.01,2.6601791381835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,1,balanced,1.763594627380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,1,power_law_1.01,3.4942462921142576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,1,balanced,3.8601598739624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,1,power_law_1.01,4.326137542724609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,1,power_law_1.01,6.844012451171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,1,balanced,2.604863961537679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,1,power_law_1.01,13.510086059570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,1,power_law_1.2,0.03128319978713989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,1,power_law_1.2,0.037484800815582274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,1,power_law_1.2,0.04718720018863678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,1,power_law_1.2,0.06443520188331604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,1,balanced,3.4457066853841147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,1,power_law_1.2,0.0920960009098053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,1,power_law_1.2,0.1489408016204834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,1,power_law_1.2,0.03558399975299835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,1,power_law_1.2,0.15615999698638916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,1,power_law_1.2,0.03671680092811584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,1,power_law_1.2,0.1644863963127136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,1,power_law_1.2,0.04474239945411682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,1,power_law_1.2,0.16842880249023437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,1,power_law_1.2,0.05588480234146118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,1,power_law_1.2,0.17208319902420044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,1,power_law_1.2,0.06511359810829162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,1,power_law_1.2,0.18012800216674804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,1,power_law_1.2,0.10127359628677368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,1,power_law_1.2,0.18575359582901002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,1,power_law_1.2,0.10558079481124878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,1,balanced,4.283391952514648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,1,power_law_1.2,0.19702399969100953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,1,power_law_1.2,0.11256320476531982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,1,power_law_1.2,0.2141119956970215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,1,power_law_1.2,0.11696000099182129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,1,power_law_1.2,0.21969919204711913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,1,power_law_1.2,0.11766400337219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,1,power_law_1.2,0.23001599311828613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,1,power_law_1.2,0.1254464030265808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,1,power_law_1.2,0.23687679767608644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,1,balanced,7.5867570241292315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,1,power_law_1.2,0.13418879508972167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,1,power_law_1.2,0.2693824052810669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,1,power_law_1.2,0.1393728017807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,1,power_law_1.2,0.28739199638366697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,1,power_law_1.2,0.14198399782180787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,1,power_law_1.2,0.33464319705963136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,1,power_law_1.2,0.1519871950149536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,1,power_law_1.2,0.3874495983123779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,1,power_law_1.2,0.16240639686584474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,1,power_law_1.2,0.4871551990509033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,1,power_law_1.2,0.18127360343933105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,1,power_law_1.2,0.593932819366455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,1,balanced,6.809520085652669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,1,power_law_1.2,0.21191039085388183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,1,power_law_1.2,0.7822336196899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,1,power_law_1.2,0.23401598930358886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,1,power_law_1.2,0.9889727592468261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,1,power_law_1.2,0.28562560081481936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,1,power_law_1.2,1.414956760406494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,1,power_law_1.2,0.3403968095779419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,1,power_law_1.2,1.8699392318725585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,1,power_law_1.2,0.44737920761108396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,1,power_law_1.2,2.2979711532592773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,1,power_law_1.2,0.5547327995300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,1,power_law_1.2,0.7754623889923096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,1,power_law_1.2,3.559212875366211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,1,power_law_1.2,0.9924799919128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,1,power_law_1.2,1.455020809173584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,1,power_law_1.2,7.435513305664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,1,power_law_1.2,1.9175552368164062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,1,power_law_1.2,2.378508758544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,1,power_law_1.2,3.7687423706054686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,1,power_law_1.2,7.9300994873046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,1,balanced,13.481781005859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,1,power_law_1.2,0.05493760108947754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,1,power_law_1.2,0.06451839804649354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,1,power_law_1.2,0.06722559928894042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,1,power_law_1.2,0.0773248016834259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,1,power_law_1.2,0.08664960265159607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,2,balanced,0.05049066742261251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,1,power_law_1.2,0.11793919801712036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,2,balanced,0.067930668592453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,2,balanced,0.06741333504517873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,1,power_law_1.2,0.12351360321044921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,2,balanced,0.09752532839775085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,2,balanced,0.10110933581988017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,1,power_law_1.2,0.12982399463653566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,2,balanced,0.16741865873336792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,2,balanced,0.1749066710472107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,1,power_law_1.2,0.13860479593276978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,2,balanced,0.3038613398869832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,2,balanced,0.3128053347269694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,1,power_law_1.2,0.14326399564743042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,2,balanced,0.5793600082397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,2,balanced,0.3165760040283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,1,power_law_1.2,0.1524415969848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,2,balanced,0.5925333499908447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,2,balanced,0.32020799318949383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,1,power_law_1.2,0.1628543972969055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,2,balanced,0.592416008313497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,2,balanced,0.320415993531545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,1,power_law_1.2,0.16872960329055786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,2,balanced,0.5867466529210409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,2,balanced,0.32148265838623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,1,power_law_1.2,0.18710399866104127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,2,balanced,0.5865866740544637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,2,balanced,0.32472000519434613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,2,balanced,0.588645339012146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,2,balanced,0.3286400039990743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,1,power_law_1.2,0.2019968032836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,2,balanced,0.33298667271931964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,2,balanced,0.5928906599680582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,1,power_law_1.2,0.21831040382385253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,2,balanced,0.5974453290303549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,2,balanced,0.33612799644470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,2,balanced,0.5984266599019369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,2,balanced,0.3415306806564331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,2,balanced,0.6022826830546061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,1,power_law_1.2,0.23134078979492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,2,balanced,0.35277867317199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,1,power_law_1.2,0.27929599285125734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,2,balanced,0.6309653520584106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,2,balanced,0.3556266625722249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,1,power_law_1.2,0.3419584035873413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,2,balanced,0.6356746753056844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,2,balanced,0.3718239863713582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,2,balanced,0.05434666574001312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,1,power_law_1.2,0.4619135856628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,2,balanced,0.6569386720657349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,2,balanced,0.07158400118350983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,2,balanced,0.39211201667785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,1,power_law_1.2,0.5637184143066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,2,balanced,0.10564266641934712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,2,balanced,0.6737759908040365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,2,balanced,0.17697066068649292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,1,power_law_1.2,0.7773312091827392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,2,balanced,0.42474134763081867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,2,balanced,0.32098132371902466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,2,balanced,0.3221386671066284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,1,power_law_1.2,0.9837823867797851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,2,balanced,0.7103786468505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,2,balanced,0.46487998962402344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,2,balanced,0.32371199131011963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,2,balanced,0.3266613284746806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,1,power_law_1.2,1.4023679733276366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,2,balanced,0.7470986843109131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,2,balanced,0.3298506736755371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,2,balanced,0.5026826858520508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,1,power_law_1.2,1.8227455139160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,2,balanced,0.3326080044110616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,2,balanced,0.3378133376439412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,2,balanced,0.7803306579589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,1,power_law_1.2,2.661337661743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,2,balanced,0.34482133388519287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,2,balanced,0.6801386674245199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,2,balanced,0.3514773448308309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,1,power_law_1.2,3.4966079711914064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,2,balanced,0.3612746795018514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,2,balanced,1.007263978322347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,1,power_law_1.2,4.334131240844727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,2,balanced,0.772981325785319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,1,power_law_1.2,6.827232360839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,2,balanced,1.0808906555175781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,2,balanced,0.3776586850484212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,2,balanced,1.0900426705678303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,2,balanced,0.3845813274383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,1,power_law_1.2,13.531027221679688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,2,power_law_1.01,0.09526399970054626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,2,balanced,1.5037013689676921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,2,power_law_1.01,0.0972927987575531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,2,power_law_1.01,0.12362240552902222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,2,balanced,1.4020427068074544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,2,power_law_1.01,0.22055680751800538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,2,power_law_1.01,0.29900801181793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,2,balanced,1.9628000259399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,2,power_law_1.01,0.49047040939331055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,2,balanced,0.4193546772003174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,2,power_law_1.01,0.5167935848236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,2,balanced,0.46773866812388104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,2,power_law_1.01,0.5426368236541748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,2,balanced,2.030277411142985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,2,balanced,0.5146239995956421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,2,power_law_1.01,0.5551040172576904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,2,power_law_1.01,0.5631040096282959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,2,balanced,0.6664586861928304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,2,balanced,2.861760139465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,2,power_law_1.01,0.571673583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,2,power_law_1.01,0.5946432113647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,2,balanced,0.7476800282796224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,2,power_law_1.01,0.5918015956878662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,2,power_law_1.01,0.612179183959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,2,balanced,1.146773338317871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,2,power_law_1.01,0.6458240032196045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,2,power_law_1.01,0.6841599941253662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,2,power_law_1.01,0.7041855812072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,2,balanced,2.6750081380208335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,2,balanced,1.316383997599284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,2,power_law_1.01,0.7779327869415283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,2,power_law_1.01,0.7674496173858643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,2,balanced,3.779381434122721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,2,power_law_1.01,0.8841471672058105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,2,balanced,1.9167200724283855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,2,power_law_1.01,0.9777728080749511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,2,power_law_1.01,0.06598399877548218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,2,power_law_1.01,1.2217984199523926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,2,power_law_1.01,0.060524797439575194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,2,power_law_1.01,1.5047552108764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,2,power_law_1.01,0.09338240027427673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,2,balanced,2.5419626235961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,2,power_law_1.01,2.03753604888916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,2,power_law_1.01,0.1384511947631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,2,power_law_1.01,2.617286491394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,2,balanced,3.330810546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,2,power_law_1.01,0.17055360078811646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,2,power_law_1.01,0.07545599937438965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,2,power_law_1.01,0.2678656101226807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,2,power_law_1.01,3.4884353637695313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,2,power_law_1.01,0.07073280215263367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,2,power_law_1.01,0.28199679851531984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,2,balanced,4.761061350504558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,2,power_law_1.01,4.480934524536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,2,power_law_1.01,0.09522560238838196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,2,power_law_1.01,0.29344639778137205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,2,power_law_1.01,0.12906240224838256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,2,balanced,3.791685422261556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,2,power_law_1.01,0.29390079975128175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,2,power_law_1.01,5.452646255493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,2,power_law_1.01,0.1768447995185852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,2,power_law_1.01,0.30005760192871095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,2,power_law_1.01,8.221804809570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,2,power_law_1.01,0.31765758991241455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,2,power_law_1.01,0.28096001148223876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,2,power_law_1.01,0.32522239685058596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,2,power_law_1.01,0.2911616086959839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,2,power_law_1.01,0.342739200592041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,2,power_law_1.01,0.3054527997970581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,2,power_law_1.01,16.564166259765624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,2,power_law_1.01,0.33692800998687744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,2,power_law_1.01,0.31562879085540774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,2,power_law_1.01,0.3678272008895874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,2,power_law_1.01,0.33296639919281007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,2,power_law_1.01,0.3881472110748291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,2,balanced,5.0396318435668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,2,power_law_1.2,0.09105920195579528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,2,power_law_1.01,0.35671679973602294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,2,power_law_1.01,0.3825727939605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,2,power_law_1.01,0.44403839111328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,2,power_law_1.01,0.379366397857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,2,power_law_1.2,0.07437440156936645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,2,balanced,5.29860273996989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,2,power_law_1.01,0.4884672164916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,2,power_law_1.01,0.38839681148529054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,2,power_law_1.2,0.12511999607086183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,2,power_law_1.01,0.5446400165557861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,2,power_law_1.01,0.42749438285827634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,2,power_law_1.2,0.18469120264053346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,2,balanced,7.383877436319987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,2,power_law_1.01,0.6312575817108155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,2,power_law_1.2,0.27245440483093264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,2,power_law_1.01,0.7720320224761963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,2,power_law_1.2,0.5007936000823975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,2,power_law_1.01,0.42080001831054686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,2,power_law_1.01,0.9253312110900879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,2,power_law_1.2,0.5508800029754639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,2,power_law_1.01,0.46277761459350586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,2,balanced,6.282538731892903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,2,power_law_1.01,1.2810175895690918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,2,power_law_1.2,0.5474048137664795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,2,power_law_1.01,1.727027130126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,2,power_law_1.2,0.5522175788879394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,2,power_law_1.01,2.4411008834838865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,2,power_law_1.01,0.46399998664855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,2,power_law_1.2,0.5731264114379883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,2,power_law_1.01,3.006092834472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,2,power_law_1.01,0.5437119960784912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,2,power_law_1.2,0.5743231773376465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,2,power_law_1.01,0.6595392227172852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,2,power_law_1.01,4.026380920410157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,2,power_law_1.2,0.583513593673706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,2,power_law_1.01,0.7900991916656495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,2,power_law_1.2,0.6047743797302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,2,power_law_1.01,6.15747184753418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,2,power_law_1.2,0.6497983932495117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,2,power_law_1.01,0.9888256072998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,2,power_law_1.2,0.6661439895629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,2,power_law_1.01,1.3104063987731933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,2,power_law_1.01,11.768185424804688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,2,power_law_1.2,0.6949312210083007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,2,power_law_1.01,1.7258176803588867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,2,power_law_1.2,0.7110335826873779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,2,power_law_1.01,2.358336067199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,2,power_law_1.2,0.8234047889709473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,2,power_law_1.01,3.001420783996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,2,power_law_1.2,0.7892223834991455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,2,balanced,10.043584187825521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,2,power_law_1.2,0.9080256462097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,2,power_law_1.01,4.401023864746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,2,power_law_1.2,1.0562944412231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,2,power_law_1.01,5.990329742431641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,2,power_law_1.2,1.2863679885864259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,2,power_law_1.01,7.55823974609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,2,power_law_1.2,1.4843647956848145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,2,power_law_1.01,11.161177825927734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,2,balanced,10.534847895304361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,2,power_law_1.2,2.169561576843262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,2,power_law_1.2,2.7116416931152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,2,power_law_1.2,3.5833152770996093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,2,power_law_1.01,22.738790893554686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,2,balanced,14.701109568277994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,2,power_law_1.2,4.7590782165527346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,2,power_law_1.2,6.054886245727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,2,power_law_1.2,0.06672000288963317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,2,power_law_1.2,9.955225372314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,2,power_law_1.2,0.05878400206565857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,2,power_law_1.2,0.07420799732208253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,2,power_law_1.2,19.54761657714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,2,power_law_1.2,0.11324160099029541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,2,power_law_1.2,0.1420799970626831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,2,power_law_1.2,0.2673919916152954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,2,power_law_1.2,0.29324800968170167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,2,power_law_1.2,0.2973376035690308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,2,power_law_1.2,0.30548479557037356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,2,power_law_1.2,0.318124794960022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,2,power_law_1.2,0.32033278942108157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,2,balanced,20.193514506022137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,2,power_law_1.2,0.34099841117858887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,2,power_law_1.2,0.3442368030548096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,2,power_law_1.2,0.36355199813842776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,2,power_law_1.2,0.3777343988418579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,2,power_law_1.2,0.39701759815216064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,2,power_law_1.2,0.40502400398254396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,2,power_law_1.2,0.461516809463501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,2,power_law_1.2,0.47945599555969237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,2,power_law_1.2,0.5709760189056396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,2,power_law_1.2,0.6681280136108398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,2,power_law_1.2,0.8347711563110352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,2,power_law_1.2,1.0011967658996581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,2,power_law_1.2,1.2974783897399902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,2,power_law_1.2,1.901299285888672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,2,power_law_1.2,2.4482751846313477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,2,power_law_1.2,3.5986560821533202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,2,power_law_1.2,4.256825637817383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,2,power_law_1.2,6.349760055541992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,2,power_law_1.2,14.071347045898438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,2,power_law_1.2,0.07552639842033386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,2,power_law_1.2,0.06647679805755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,2,power_law_1.2,0.09354239702224731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,2,power_law_1.2,0.12918399572372435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,2,power_law_1.2,0.15304960012435914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,2,power_law_1.2,0.27431039810180663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,2,power_law_1.2,0.2859328031539917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,2,power_law_1.2,0.31366400718688964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,2,power_law_1.2,0.3251391887664795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,2,power_law_1.2,0.3328768014907837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,2,power_law_1.2,0.3481152057647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,2,power_law_1.2,0.38241279125213623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,2,power_law_1.2,0.3966655969619751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,2,power_law_1.2,0.4291584014892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,2,power_law_1.2,0.43157119750976564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,2,power_law_1.2,0.46027522087097167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,1,balanced,0.06834133466084798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,1,balanced,0.09861333171526591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,1,balanced,0.17004267374674478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,2,power_law_1.2,0.4613952159881592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,1,balanced,0.3142133355140686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,1,balanced,0.5826880137125651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,2,power_law_1.2,0.542195177078247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,1,balanced,0.585589329401652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,2,power_law_1.2,0.6677887916564942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,1,balanced,0.589141329129537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,1,balanced,0.5944639841715494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,2,power_law_1.2,0.8146240234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,1,balanced,0.5947200059890747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,1,balanced,0.051594664653142296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,2,power_law_1.2,0.9674240112304687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,1,balanced,0.5970933437347412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,1,balanced,0.5994240045547485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,1,balanced,0.06797333558400472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,2,power_law_1.2,1.399782371520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,1,balanced,0.6060959895451864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,1,balanced,0.10380799571673076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,2,power_law_1.2,1.9378240585327149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,1,balanced,0.17642132441202799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,1,balanced,0.6093066533406576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,1,balanced,0.31618666648864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,2,power_law_1.2,2.4082239151000975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,1,balanced,0.618773341178894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,1,balanced,0.3214026689529419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,2,power_law_1.2,3.449747085571289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,1,balanced,0.6478186845779419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,1,balanced,0.3260106643040975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,1,balanced,0.6552533308664957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,1,balanced,0.3275573253631592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,2,power_law_1.2,4.646854400634766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,1,balanced,0.33003199100494385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,1,balanced,0.6695733070373535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,1,power_law_1.01,0.06297600269317627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,2,power_law_1.2,6.235270309448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,1,balanced,0.3350133498509725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,1,balanced,0.7123146851857504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,1,power_law_1.01,0.07007359862327575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,1,balanced,0.33881068229675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,2,power_law_1.2,7.2924354553222654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,1,balanced,0.7574666341145834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,1,balanced,0.3436266581217448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,1,power_law_1.01,0.1384768009185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,1,balanced,0.348688006401062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,1,power_law_1.01,0.2056704044342041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,1,balanced,0.8197387059529623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,1,balanced,0.36214399337768555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,2,power_law_1.2,13.65716552734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,1,power_law_1.01,0.28323841094970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,1,balanced,0.0740586668252945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,1,balanced,0.3708053429921468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,1,power_law_1.01,0.04856959879398346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,1,balanced,0.8812533219655355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,1,power_law_1.01,0.49013118743896483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,1,balanced,0.08830933769543965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,1,balanced,0.38097067674001056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,1,power_law_1.01,0.054688000679016115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,1,power_law_1.01,0.5014143943786621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,2,power_law_1.2,24.902560424804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,1,balanced,0.12019733587900798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,1,balanced,0.40992534160614014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,1,balanced,1.133786678314209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,1,power_law_1.01,0.08385279774665833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,1,power_law_1.01,0.5324992179870606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,1,balanced,0.19179733594258627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,1,balanced,0.44673065344492596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,1,power_law_1.01,0.13148159980773927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,1,power_law_1.01,0.5378496170043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,1,balanced,0.33849068482716876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,1,power_law_1.01,0.16412160396575928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,1,balanced,0.48096001148223877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,1,balanced,1.2712960243225098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,1,power_law_1.01,0.5609920024871826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,1,balanced,0.343231995900472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,1,power_law_1.01,0.2663615942001343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,1,power_law_1.01,0.5735551834106445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,1,balanced,0.5476053158442179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,1,balanced,0.3466026782989502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,1,power_law_1.01,0.28339200019836425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,1,power_law_1.01,0.5879615783691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,1,balanced,0.35174934069315594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,1,power_law_1.01,0.289305591583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,1,balanced,0.6174879868825277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,1,balanced,1.7906187375386555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,1,balanced,0.35836267471313477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,1,power_law_1.01,0.6042304039001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,1,power_law_1.01,0.3046528100967407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,1,balanced,0.36238932609558105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,1,power_law_1.01,0.652947187423706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,1,power_law_1.01,0.30921599864959715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,1,power_law_1.01,0.07152000069618225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,1,balanced,0.8529280026753744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,1,balanced,0.37087468306223553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,1,power_law_1.01,0.3350271940231323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,1,power_law_1.01,0.6745279788970947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,1,power_law_1.01,0.07964800000190735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,1,balanced,0.3821760018666585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,1,power_law_1.01,0.34815359115600586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,1,power_law_1.01,0.10088319778442383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,1,power_law_1.01,0.6981247901916504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,1,balanced,2.3242506980895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,1,balanced,0.988159974416097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,1,power_law_1.01,0.13889919519424437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,1,balanced,0.390394647916158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,1,power_law_1.01,0.36973440647125244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,1,power_law_1.01,0.7213376045227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,1,power_law_1.01,0.18254719972610473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,1,power_law_1.01,0.3706559896469116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,1,balanced,0.40461333592732746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,1,power_law_1.01,0.2867136001586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,1,power_law_1.01,0.8248512268066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,1,power_law_1.01,0.38283519744873046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,1,power_law_1.01,0.30247681140899657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,1,balanced,1.420570691426595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,1,power_law_1.01,0.792742395401001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,1,power_law_1.01,0.4071936130523682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,1,power_law_1.01,0.3185472011566162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,1,power_law_1.01,0.3374975919723511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,1,power_law_1.01,0.4165823936462402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,1,power_law_1.01,0.8931839942932129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,1,power_law_1.01,0.3540800094604492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,1,balanced,3.412720044453939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,1,power_law_1.01,0.4775551795959473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,1,power_law_1.01,1.026905632019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,1,balanced,0.4330720106760661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,1,power_law_1.01,0.3842367887496948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,1,power_law_1.01,0.5225279808044434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,1,power_law_1.01,0.40974721908569334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,1,power_law_1.01,1.2838784217834474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,1,balanced,0.44762134552001953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,1,power_law_1.01,0.6160192012786865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,1,power_law_1.01,0.42731518745422364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,1,balanced,1.881216049194336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,1,power_law_1.01,0.4727424144744873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,1,power_law_1.01,1.537600040435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,1,power_law_1.01,0.7112512111663818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,1,power_law_1.01,2.077414321899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,1,power_law_1.01,0.9196672439575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,1,power_law_1.01,0.4785280227661133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,1,power_law_1.01,2.595155143737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,1,power_law_1.01,1.1289536476135253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,1,power_law_1.01,0.5180607795715332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,1,power_law_1.01,3.727276611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,1,power_law_1.01,1.5600831985473633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,1,balanced,4.52293332417806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,1,balanced,2.7839574813842773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,1,balanced,0.5213386615117391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,1,power_law_1.01,4.794681549072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,1,power_law_1.01,1.9815744400024413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,1,power_law_1.01,0.5337920188903809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,1,balanced,0.6187413136164347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,1,power_law_1.01,2.8275007247924804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,1,power_law_1.01,5.862041473388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,1,power_law_1.01,0.6754559993743896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.01,0.7814784049987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,1,balanced,0.682042678197225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,1,power_law_1.01,3.647654342651367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.01,1.0024959564208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,1,power_law_1.01,9.075135803222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.01,1.2340415954589843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,1,power_law_1.01,4.515232086181641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,1,balanced,0.9050133228302002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.01,1.6855424880981444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,1,power_law_1.01,18.5434814453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.01,2.139423942565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,1,power_law_1.01,7.14031982421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,1,balanced,1.0511893431345622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,1,balanced,3.6855732599894204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.01,3.053446388244629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.01,3.947462463378906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,1,power_law_1.2,0.06255360245704651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,1,power_law_1.01,14.749095153808593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,1,balanced,5.675242741902669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,1,balanced,1.6559359232584636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.01,5.7791999816894535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,1,power_law_1.2,0.06828160285949707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,1,power_law_1.2,0.12378879785537719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.01,7.618182373046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,1,balanced,1.9580213228861492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,1,power_law_1.2,0.17731839418411255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,1,power_law_1.01,9.45959701538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,1,power_law_1.2,0.2535167932510376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,1,power_law_1.2,0.480844783782959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,1,power_law_1.01,14.980038452148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,1,balanced,2.8761278788248696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,1,balanced,4.5878346761067705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,1,power_law_1.2,0.5339136123657227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,1,power_law_1.2,0.5536448001861572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,1,power_law_1.01,29.758123779296874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,1,power_law_1.2,0.5595967769622803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,1,balanced,3.796016057332357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,1,power_law_1.2,0.5782015800476075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,1,power_law_1.2,0.5758463859558105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,1,power_law_1.2,0.6000383853912353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,1,balanced,9.086032231648764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,1,power_law_1.2,0.6111680030822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,1,power_law_1.2,0.6613632202148437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,1,power_law_1.2,0.6751103878021241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,1,balanced,5.626000086466472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,1,power_law_1.2,0.7233280181884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,1,power_law_1.2,0.732428789138794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,1,power_law_1.2,0.838310432434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,1,power_law_1.2,0.8163328170776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,1,balanced,7.066837310791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,1,power_law_1.2,0.920633602142334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,1,power_law_1.2,1.059552001953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,1,power_law_1.2,1.3340800285339356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,1,power_law_1.2,1.5788543701171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,1,balanced,7.447957356770833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,1,power_law_1.2,2.1404672622680665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,1,power_law_1.2,2.671219253540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,1,power_law_1.2,3.7721343994140626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,1,power_law_1.2,4.8641407012939455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,1,power_law_1.2,5.886515045166016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,1,power_law_1.2,9.14316177368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,1,balanced,9.284357070922852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,1,power_law_1.2,18.83038787841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,1,balanced,18.23748270670573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,1,power_law_1.2,0.04803839921951294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,1,balanced,14.071183522542318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,1,power_law_1.2,0.057894402742385866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,1,balanced,14.854544321695963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,1,power_law_1.2,0.08303999900817871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,1,power_law_1.2,0.10944000482559205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,1,power_law_1.2,0.14698879718780516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,1,power_law_1.2,0.26830079555511477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,1,power_law_1.2,0.2921855926513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,1,power_law_1.2,0.29453439712524415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,1,power_law_1.2,0.3175296068191528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,1,power_law_1.2,0.32486400604248045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,1,power_law_1.2,0.33829119205474856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,1,power_law_1.2,0.35557119846343993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,1,power_law_1.2,0.37239038944244385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,1,power_law_1.2,0.3751424074172974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,1,power_law_1.2,0.39692800045013427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,1,power_law_1.2,0.41349120140075685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,1,power_law_1.2,0.42780160903930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,1,power_law_1.2,0.4878975868225098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,1,power_law_1.2,0.5276671886444092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,1,power_law_1.2,0.6246848106384277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,1,power_law_1.2,0.7389503955841065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,1,power_law_1.2,0.9510848045349121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,1,power_law_1.2,1.1506303787231444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,1,power_law_1.2,1.5749183654785157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,1,power_law_1.2,1.9882368087768554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,1,power_law_1.2,2.829478454589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,1,power_law_1.2,3.6721729278564452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,1,balanced,29.804763793945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,1,power_law_1.2,4.50250244140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,2,balanced,0.13798933227856955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,1,power_law_1.2,7.144249725341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,2,balanced,0.21966399749120077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,2,balanced,0.38661332925160724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,1,power_law_1.2,14.97734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,1,power_law_1.2,0.07189760208129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,2,balanced,0.7333760261535645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,2,balanced,1.4250507354736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,1,power_law_1.2,0.07489920258522034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,1,power_law_1.2,0.0987775981426239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,2,balanced,1.776144027709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,1,power_law_1.2,0.12861440181732178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,2,balanced,1.787482738494873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,1,power_law_1.2,0.16159360408782958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,2,balanced,1.7846080462137859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,1,power_law_1.2,0.2788288116455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,2,balanced,1.779685338338216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,1,power_law_1.2,0.30391678810119627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,2,balanced,1.7896639506022136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,2,balanced,0.09450133641560872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,1,power_law_1.2,0.3247999906539917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,2,balanced,1.7900106112162273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,2,balanced,0.13206400473912558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,1,power_law_1.2,0.3507776021957397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,2,balanced,0.21541867653528848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,2,balanced,1.8019466400146484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,2,balanced,0.3924853404362996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,1,power_law_1.2,0.35852799415588377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,2,balanced,0.735525369644165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,2,balanced,1.8070185979207356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,1,power_law_1.2,0.3884671926498413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,2,balanced,0.9206079641977946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,1,power_law_1.2,0.40855040550231936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,2,balanced,1.838853359222412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,2,balanced,0.9162507057189941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,2,balanced,0.9321386814117432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,1,power_law_1.2,0.43056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,2,balanced,1.847215970357259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,2,balanced,0.9355413118998209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,1,power_law_1.2,0.47606401443481444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,2,balanced,0.9368533293406168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,2,balanced,1.8599360783894856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,2,balanced,0.9382773240407308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,2,balanced,1.892207940419515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,2,balanced,0.9489280382792155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,1,power_law_1.2,0.48942079544067385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,2,balanced,1.9608640670776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,2,balanced,0.9526826540629069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,1,power_law_1.2,0.5170752048492432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,2,balanced,0.9666986465454102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,2,balanced,1.9832693735758464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,2,balanced,0.9772373040517172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,2,balanced,0.9869919617970785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,1,power_law_1.2,0.5460351943969727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,2,balanced,2.65336004892985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,2,balanced,1.0138453642527263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,1,power_law_1.2,0.6712319850921631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,2,balanced,1.0707253615061443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,2,balanced,2.1626826922098794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.2,0.7875199794769288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,2,balanced,1.0775252978007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.2,1.0127103805541993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,2,balanced,1.5431040128072102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.2,1.2447936058044433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,2,balanced,4.109530766805013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.2,1.6989952087402345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,2,balanced,1.219381332397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.2,2.1473344802856444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.2,3.06296329498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,2,balanced,2.1271680196126304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,2,balanced,2.7877492904663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.2,3.9613632202148437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,2,balanced,1.728101412455241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.2,5.800646209716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,2,balanced,5.319744110107422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.2,7.615532684326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,2,balanced,3.0216852823893228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,1,power_law_1.2,9.454342651367188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,1,power_law_1.2,14.947865295410157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,2,balanced,5.150752067565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,2,power_law_1.01,0.2278143882751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,2,balanced,0.1030453344186147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,2,balanced,3.1647520065307617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,2,power_law_1.01,0.2902656078338623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,2,balanced,0.14035733540852866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,2,power_law_1.01,0.3204927921295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,2,balanced,0.2408213416735331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,1,power_law_1.2,29.649151611328126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,2,balanced,0.40457598368326825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,2,power_law_1.01,0.547711992263794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,2,balanced,0.7526186307271322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,2,power_law_1.01,0.7656320095062256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,2,balanced,0.9278666973114014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,2,balanced,6.998821258544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,2,power_law_1.01,1.3268416404724122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,2,balanced,4.624693234761556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,2,balanced,0.9321599801381429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,2,power_law_1.01,1.4226304054260255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,2,balanced,0.9366292953491211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,2,power_law_1.01,0.12911360263824462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,2,power_law_1.01,1.5165696144104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,2,balanced,0.9382293224334717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,2,power_law_1.01,0.1623744010925293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,2,power_law_1.01,1.5352383613586427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,2,balanced,0.9453866481781006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,2,power_law_1.01,0.18885120153427123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,2,power_law_1.01,1.5385663986206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,2,balanced,0.956063985824585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,2,power_law_1.01,0.3057152032852173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,2,power_law_1.01,1.636832046508789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,2,balanced,0.9659466743469238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,2,power_law_1.01,0.4345856189727783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,2,power_law_1.01,1.6940031051635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,2,balanced,5.72053337097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,2,balanced,9.202410380045572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,2,balanced,0.9743680159250895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,2,power_law_1.01,0.7274367809295654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,2,power_law_1.01,1.7944511413574218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,2,balanced,0.9926506678263346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,2,power_law_1.01,0.7733312129974366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,2,power_law_1.01,1.671673583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,2,power_law_1.01,0.7875135898590088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,2,balanced,1.0138453642527263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,2,power_law_1.01,1.8487232208251954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,2,power_law_1.01,0.8088000297546387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,2,power_law_1.01,1.899193572998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,2,power_law_1.01,0.8290047645568848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,2,power_law_1.01,2.029824066162109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,2,power_law_1.01,0.8989824295043946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,2,power_law_1.01,0.9360128402709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,2,power_law_1.01,2.3255168914794924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,2,balanced,1.0357653299967449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,2,power_law_1.01,0.9637887954711915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,2,power_law_1.01,2.34783992767334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,2,balanced,6.567685445149739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,2,power_law_1.01,0.9376640319824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,2,power_law_1.01,2.82926082611084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,2,balanced,10.662837346394857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,2,power_law_1.01,1.0178239822387696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,2,power_law_1.01,3.28869743347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,2,power_law_1.01,1.0705344200134277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,2,power_law_1.01,4.045222473144531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,2,balanced,1.073525349299113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,2,power_law_1.01,1.058899211883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,2,power_law_1.01,4.248582458496093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,2,power_law_1.01,1.15731201171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,2,power_law_1.01,1.2544447898864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,2,power_law_1.01,5.387526321411133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,2,power_law_1.01,1.5750016212463378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,2,power_law_1.01,6.209363174438477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,2,power_law_1.01,1.7041791915893554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,2,power_law_1.01,9.59267807006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,2,power_law_1.01,2.152012825012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,2,power_law_1.01,2.4351999282836916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,2,power_law_1.01,10.773133087158204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,2,balanced,1.185871998469035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,2,power_law_1.01,3.231436920166016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,2,balanced,1.2706720034281414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,2,power_law_1.01,13.856159973144532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,2,power_law_1.01,3.9108158111572267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,2,balanced,10.52243169148763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,2,balanced,1.475935935974121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,2,power_law_1.01,5.329433441162109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,2,balanced,17.619839986165363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,2,power_law_1.01,20.806207275390626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,2,power_law_1.01,6.468646240234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,2,balanced,1.6289547284444172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,2,power_law_1.2,0.23054718971252441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,2,power_law_1.01,7.7935234069824215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,2,balanced,2.505407969156901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,2,power_law_1.2,0.17011200189590453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,2,power_law_1.01,0.15119359493255616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,2,power_law_1.01,41.335943603515624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,2,power_law_1.01,12.106566619873046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,2,power_law_1.2,0.25589759349823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,2,power_law_1.01,0.2214143991470337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,2,balanced,2.825413386027018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,2,power_law_1.2,0.5470719814300538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,2,power_law_1.01,0.18495999574661254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,2,power_law_1.01,22.680339050292968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,2,power_law_1.2,0.6962240219116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,2,power_law_1.01,0.303385591506958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,2,power_law_1.2,1.29301118850708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,2,power_law_1.01,0.4654848098754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,2,balanced,4.15342394510905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,2,power_law_1.01,0.7027647972106934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,2,power_law_1.2,1.4436927795410157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,2,power_law_1.2,1.6102783203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,2,power_law_1.01,0.7543551921844482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,2,power_law_1.01,0.7671103954315186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,2,power_law_1.2,1.590681552886963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,2,power_law_1.01,0.8058048248291015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,2,power_law_1.2,1.632204818725586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,2,balanced,5.521711985270183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,2,power_law_1.01,0.8535103797912598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,2,power_law_1.2,1.7428159713745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,2,power_law_1.01,0.9241151809692383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,2,power_law_1.2,1.7993728637695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,2,power_law_1.01,0.9782784461975098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,2,power_law_1.2,1.8162879943847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,2,power_law_1.01,1.032691192626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,2,power_law_1.2,1.8809343338012696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,2,balanced,7.714805603027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,2,power_law_1.01,1.1909119606018066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,2,power_law_1.2,1.9737983703613282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,2,power_law_1.01,1.2475839614868165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,2,power_law_1.2,2.040115165710449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,2,power_law_1.2,2.1302911758422853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,2,power_law_1.2,2.5078847885131834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,2,power_law_1.01,1.1727616310119628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,2,balanced,20.59939193725586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,2,power_law_1.2,2.4691583633422853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,2,power_law_1.2,3.1275455474853517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,2,power_law_1.01,1.2679807662963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,2,balanced,34.00682576497396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,2,balanced,10.608778635660807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,2,power_law_1.2,3.3928062438964846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,2,power_law_1.2,4.195923233032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,2,power_law_1.2,4.498163223266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,2,power_law_1.01,1.3560511589050293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,2,power_law_1.01,1.586944007873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,2,power_law_1.2,5.838937759399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,2,power_law_1.01,1.7454912185668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,2,power_law_1.2,6.53088607788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,2,power_law_1.01,2.086528015136719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,2,power_law_1.01,2.565068817138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,2,power_law_1.2,9.189926147460938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,2,balanced,12.740538279215494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,2,power_law_1.01,3.5042751312255858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,2,power_law_1.2,12.292985534667968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,2,power_law_1.01,4.882508850097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,2,power_law_1.01,5.910099029541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,2,power_law_1.2,14.847482299804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,2,power_law_1.01,9.212531280517577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,2,power_law_1.2,21.25293426513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,2,power_law_1.01,12.120832061767578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,2,power_law_1.2,0.13992960453033448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,2,power_law_1.01,14.427839660644532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,2,power_law_1.2,0.1201856017112732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,2,power_law_1.2,44.01111755371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,2,power_law_1.2,0.15665279626846312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,2,power_law_1.01,25.436607360839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,2,power_law_1.2,0.271833610534668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,2,power_law_1.2,0.3682687997817993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,2,balanced,21.200149536132812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,2,power_law_1.2,0.6612544059753418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,2,power_law_1.01,45.061761474609376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,2,power_law_1.2,0.7313536167144775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,2,power_law_1.2,0.7925951957702637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,2,power_law_1.2,0.8405376434326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,2,power_law_1.2,0.8683391571044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,2,power_law_1.2,0.9448703765869141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,2,power_law_1.2,0.9869119644165039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,2,power_law_1.2,1.0156607627868652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,2,power_law_1.2,1.013043212890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,2,power_law_1.2,1.0337663650512696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,2,power_law_1.2,1.084006404876709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,2,power_law_1.2,1.0820480346679688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,2,power_law_1.2,1.2423871994018554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,2,power_law_1.2,1.3439488410949707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,2,power_law_1.2,1.619923210144043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,2,power_law_1.2,1.7966144561767579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,2,power_law_1.2,2.191142463684082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,2,power_law_1.2,2.6616447448730467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,2,power_law_1.2,3.2842559814453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,2,power_law_1.2,4.05140495300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,2,balanced,43.238789876302086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,2,power_law_1.2,5.71283187866211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,2,power_law_1.2,6.480121612548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,2,power_law_1.2,9.234086608886718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,2,power_law_1.2,0.1504639983177185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,2,power_law_1.2,0.11413760185241699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,2,power_law_1.2,12.139615631103515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,2,power_law_1.2,0.18537600040435792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,2,power_law_1.2,0.2944191932678223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,2,power_law_1.2,25.41260223388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,2,power_law_1.2,0.39232640266418456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,1,balanced,0.13664000233014426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,2,power_law_1.2,0.7107327938079834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,1,balanced,0.21438932418823242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,2,power_law_1.2,0.761568021774292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,1,balanced,0.38766932487487793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,2,power_law_1.2,0.8023360252380372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,1,balanced,0.7333333492279053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,2,power_law_1.2,0.8254528045654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,1,balanced,1.4210294087727864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,2,power_law_1.2,0.8961152076721192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,1,balanced,1.7968053817749023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,2,power_law_1.2,0.9728960037231446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,1,balanced,1.7987039883931477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,2,power_law_1.2,1.0515456199645996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,1,balanced,1.8011520703633626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,2,power_law_1.2,1.098566436767578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,1,balanced,1.8020373980204265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,2,power_law_1.2,1.2298303604125977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,1,balanced,1.8165225982666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,2,power_law_1.2,1.2674688339233398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,1,balanced,1.8210080464680989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,1,balanced,1.8299573262532551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,1,balanced,1.8370505968729656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,2,power_law_1.2,1.2273344039916991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,1,balanced,0.09410132964452107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,1,balanced,1.8575092951456706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,1,balanced,0.13053866227467856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,1,balanced,1.8719520568847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,1,balanced,0.21561066309611002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,1,balanced,1.9353866577148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,2,power_law_1.2,1.308512020111084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,1,balanced,0.39584533373514813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,1,balanced,0.7479413350423177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,1,balanced,1.938421408335368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,1,balanced,0.91866135597229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,1,balanced,1.998576005299886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,2,power_law_1.2,1.3931903839111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,1,balanced,0.9252479871114095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,1,balanced,0.11826133728027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,1,balanced,0.9303733507792155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,1,balanced,2.024442672729492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,2,power_law_1.2,1.65020809173584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,1,balanced,0.15506133437156677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,1,balanced,0.9343573252360026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,2,power_law_1.2,1.8151296615600585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,1,balanced,2.8458827336629233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,1,balanced,0.2529226740201314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,1,balanced,0.9432426293691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,2,power_law_1.2,2.19116153717041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,1,balanced,0.4152853488922119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,1,balanced,0.9535199801127116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,1,balanced,2.2994186083475747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,2,power_law_1.2,2.7687679290771485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,1,balanced,0.768122673034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,1,balanced,0.9583626588185629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,1,balanced,0.9465173085530599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,2,power_law_1.2,3.357331085205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,1,balanced,0.9725013573964437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,1,balanced,0.9528373082478842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,1,balanced,4.077664057413737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,2,power_law_1.2,5.012160110473633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,1,balanced,0.9632960160573324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,1,balanced,0.9907946586608887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,2,power_law_1.2,6.521145629882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,1,balanced,0.9719733397165934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,1,balanced,1.006666660308838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,1,balanced,3.021648089090983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,1,balanced,0.9754613240559896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,1,balanced,1.0203306674957275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,2,power_law_1.2,8.78253402709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,1,balanced,0.9886026382446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,1,balanced,1.0441546440124512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,1,balanced,1.0071893533070881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,2,power_law_1.2,13.200076293945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,1,balanced,5.462005615234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,1,balanced,1.2655413150787354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,1,balanced,1.0230186780293782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,1,balanced,1.0509973367055256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,1,power_law_1.01,0.12357759475708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,1,balanced,1.1645759741465251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,2,power_law_1.2,14.607685852050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,1,balanced,1.0889920393625896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,1,power_law_1.01,0.19192960262298583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,1,balanced,1.3425119717915852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,1,power_law_1.01,0.2792831897735596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,1,balanced,5.595706939697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,2,power_law_1.2,24.49183349609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,1,power_law_1.01,0.49308161735534667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,1,balanced,1.3737866083780925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,1,power_law_1.01,0.7499135971069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,1,balanced,1.126912037531535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,1,power_law_1.01,0.09400960206985473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,1,power_law_1.01,1.327455997467041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,1,balanced,2.1679466565450034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,1,power_law_1.01,1.4333824157714843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,1,power_law_1.01,0.1178879976272583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,2,power_law_1.2,54.51362915039063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,1,power_law_1.01,0.17359999418258668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,1,power_law_1.01,1.4873344421386718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,1,balanced,8.422159830729166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,1,balanced,1.9992106755574544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,1,power_law_1.01,0.27783679962158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,1,power_law_1.01,1.5553279876708985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,1,balanced,1.201584021250407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,1,power_law_1.01,0.4071360111236572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,1,power_law_1.01,1.5849663734436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,1,power_law_1.01,0.6910912036895752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,1,power_law_1.01,1.5895039558410644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,1,power_law_1.01,0.7611455917358398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,1,balanced,3.474586804707845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,1,power_law_1.01,0.7846911907196045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,1,power_law_1.01,1.6492927551269532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,1,power_law_1.01,0.8225919723510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,1,power_law_1.01,1.675276756286621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,1,power_law_1.01,0.8160896301269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,1,power_law_1.01,1.7524160385131835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,1,balanced,9.946933110555014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,1,power_law_1.01,0.8651904106140137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,1,balanced,3.746272087097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,1,balanced,1.3879146575927734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,1,power_law_1.01,1.8190847396850587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,1,power_law_1.01,0.8863103866577149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,1,power_law_1.01,1.893414306640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,1,power_law_1.01,0.9136063575744628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,1,balanced,1.5226772626241047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,1,power_law_1.01,1.9382144927978515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,1,power_law_1.01,0.9372480392456055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,1,power_law_1.01,2.1678655624389647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,1,power_law_1.01,0.959552001953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,1,balanced,1.8177439371744792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,1,power_law_1.01,1.001369571685791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,1,power_law_1.01,2.5658111572265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,1,power_law_1.01,1.0541119575500488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,1,balanced,5.1578718821207685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,1,power_law_1.01,3.2191680908203124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,1,power_law_1.01,1.2020352363586426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,1,balanced,2.086282730102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,1,power_law_1.01,3.358278274536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,1,power_law_1.01,1.2827903747558593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,1,balanced,11.519242604573568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,1,power_law_1.01,1.5174464225769042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,1,power_law_1.01,4.285030364990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,1,balanced,3.1911627451578775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,1,power_law_1.01,1.6228544235229492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,1,power_law_1.01,4.352268981933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,1,power_law_1.01,2.0613119125366213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,1,power_law_1.01,5.350643157958984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,1,balanced,3.7504746119181314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,1,power_law_1.01,2.6649728775024415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,1,power_law_1.01,0.1251904010772705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,1,power_law_1.01,3.389158248901367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,1,power_law_1.01,6.427724456787109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,1,balanced,6.820410410563151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,1,power_law_1.01,0.15055999755859376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,1,power_law_1.01,3.9664894104003907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,1,power_law_1.01,8.647411346435547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,1,balanced,5.643781026204427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,1,power_law_1.01,0.19120639562606812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,1,power_law_1.01,5.444063949584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,1,power_law_1.01,0.32620160579681395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,1,power_law_1.01,10.950975799560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,1,power_law_1.01,7.038233947753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,1,power_law_1.01,0.42062082290649416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,1,power_law_1.01,13.668998718261719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,1,power_law_1.01,0.7023039817810058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,1,power_law_1.01,8.695616149902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,1,balanced,7.4799149831136065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,1,power_law_1.01,0.7872191905975342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,1,power_law_1.01,0.7966591835021972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,1,power_law_1.01,13.544230651855468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,1,power_law_1.01,19.609414672851564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,1,balanced,19.475296020507812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,1,power_law_1.01,0.8470848083496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,1,balanced,8.371327718098959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,1,power_law_1.01,0.8714559555053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,1,power_law_1.2,0.12324479818344117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,1,power_law_1.01,25.2271484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,1,power_law_1.01,0.9443519592285157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,1,power_law_1.2,0.15623680353164673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,1,power_law_1.01,38.160595703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,1,power_law_1.01,1.0080512046813965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,1,balanced,10.594709396362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,1,power_law_1.2,0.28155519962310793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,1,power_law_1.01,1.089510440826416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,1,power_law_1.2,0.46197757720947263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,1,power_law_1.2,0.6536128044128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,1,power_law_1.01,1.173299217224121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,1,power_law_1.2,1.3087167739868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,1,power_law_1.01,1.3052096366882324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,1,power_law_1.2,1.423142433166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,1,power_law_1.2,1.4948991775512694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,1,power_law_1.2,1.5767231941223145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,1,power_law_1.01,1.2731328010559082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,1,power_law_1.2,1.6032960891723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,1,power_law_1.2,1.6708671569824218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,1,power_law_1.2,1.7027584075927735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,1,balanced,14.344239552815756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,1,power_law_1.2,1.7542463302612306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,1,power_law_1.01,1.3974207878112792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,1,power_law_1.2,1.8568511962890626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,1,power_law_1.2,1.8947391510009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,1,balanced,13.019306182861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,1,power_law_1.01,1.5123007774353028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,1,power_law_1.2,1.9578304290771484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.01,1.7814592361450194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,1,power_law_1.2,1.994156837463379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,1,power_law_1.2,2.2635967254638674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.01,2.009247970581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,1,power_law_1.2,2.690771293640137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.01,2.3914432525634766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,1,power_law_1.2,3.258444976806641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.01,3.188057518005371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,1,power_law_1.2,3.4371711730957033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,1,balanced,17.23419698079427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.01,3.992620849609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,1,power_law_1.2,4.2728321075439455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.01,5.606975936889649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,1,power_law_1.2,4.4377281188964846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,1,power_law_1.2,5.443667221069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.01,7.264211273193359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,1,power_law_1.2,6.574655914306641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.01,10.594258880615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,1,power_law_1.2,8.693138885498048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,1,balanced,37.34374491373698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,1,power_law_1.2,11.291629028320312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.01,13.889581298828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,1,power_law_1.2,13.868876647949218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,1,power_law_1.01,17.367327880859374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,1,power_law_1.2,19.688064575195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,1,power_law_1.01,27.414047241210938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,1,balanced,28.468505859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,1,power_law_1.2,38.67760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,1,power_law_1.01,55.421600341796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,1,balanced,25.02423350016276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,1,power_law_1.2,0.09331200122833253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,1,power_law_1.2,0.09686400294303894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,1,power_law_1.2,0.1474176049232483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,1,power_law_1.2,0.25727999210357666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,1,power_law_1.2,0.364851188659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,1,power_law_1.2,0.6910848140716552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,1,power_law_1.2,0.7520319938659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,1,power_law_1.2,0.7830080032348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,1,power_law_1.2,0.8243776321411133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,1,power_law_1.2,0.8524800300598144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,1,power_law_1.2,0.8757568359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,1,power_law_1.2,0.9211584091186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,1,power_law_1.2,0.9452287673950195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,1,power_law_1.2,0.9644543647766113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,1,power_law_1.2,1.0084992408752442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,1,balanced,58.15380350748698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,1,power_law_1.2,1.0436927795410156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,1,power_law_1.2,1.08274564743042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,1,power_law_1.2,1.2549504280090331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,1,power_law_1.2,1.3206720352172852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,1,power_law_1.2,1.5595264434814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,1,power_law_1.2,1.6891904830932618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,1,power_law_1.2,2.1184640884399415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,1,power_law_1.2,2.7172096252441404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,1,power_law_1.2,3.480051040649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,1,power_law_1.2,4.066963195800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,1,power_law_1.2,5.5758720397949215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,1,power_law_1.2,7.2878974914550785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,1,power_law_1.2,0.12434560060501099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,1,power_law_1.2,8.971852874755859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,1,power_law_1.2,0.1286463975906372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,1,power_law_1.2,0.19103360176086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,1,power_law_1.2,13.617984008789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,2,balanced,0.13260266184806824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,1,power_law_1.2,0.2654848098754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,2,balanced,0.19985065857569376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,1,power_law_1.2,0.36417279243469236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,2,balanced,0.36051734288533527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,1,power_law_1.2,25.274534606933592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,1,power_law_1.2,0.7385024070739746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,2,balanced,0.6906720002492269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,2,balanced,1.3453973134358723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,1,power_law_1.2,0.7818751811981202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,2,balanced,2.641530672709147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,1,power_law_1.2,0.8316096305847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,2,balanced,3.9470720291137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,2,balanced,4.002442677815755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,1,power_law_1.2,0.8762304306030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,2,balanced,3.971797307332357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,1,power_law_1.2,0.9011712074279785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,2,balanced,3.986703872680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,2,balanced,3.9433066050211587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,1,power_law_1.2,0.9720383644104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,2,balanced,3.958042780558268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,1,power_law_1.2,1.0324480056762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,2,balanced,3.954400062561035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,1,power_law_1.2,1.0995967864990235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,2,balanced,3.9917173385620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,1,power_law_1.2,1.212831974029541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,2,balanced,3.988719940185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,1,power_law_1.2,1.3301888465881349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,2,balanced,4.01580810546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,2,balanced,4.041034698486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,1,power_law_1.2,1.3120127677917481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,2,balanced,4.096138636271159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,2,balanced,4.223855972290039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,1,power_law_1.2,1.4004096031188964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,2,balanced,4.346447944641113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,2,balanced,4.382218678792317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,1,power_law_1.2,1.5697279930114747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,2,balanced,4.561274528503418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,2,balanced,0.0888853371143341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.2,1.8071680068969727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,2,balanced,0.12433600425720215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.2,2.0519039154052736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,2,balanced,4.898341178894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,2,balanced,0.20403732856114706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.2,2.443891143798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,2,balanced,0.3703146775563558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.2,3.231916809082031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,2,balanced,0.6928479671478271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.2,4.019379043579102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,2,balanced,5.1717227300008135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,2,balanced,1.3574453989664714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.2,5.631135940551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,2,balanced,1.9907466570536296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,2,balanced,2.0009973843892417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.2,7.285561370849609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,2,balanced,1.9948533376057942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,2,balanced,6.422122955322266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,2,balanced,2.005589326222738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.2,10.611373138427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,2,balanced,2.0048160552978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,2,balanced,2.009413401285807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.2,13.80435791015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,2,balanced,2.0181387265523276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,2,balanced,0.12306666374206543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,2,balanced,2.03767999013265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,1,power_law_1.2,17.13981475830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,2,balanced,6.7749176025390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,2,balanced,0.15744533141454062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,2,power_law_1.01,0.13341439962387086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,2,balanced,2.0552053451538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,2,power_law_1.01,0.20217599868774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,2,balanced,0.2445440093676249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,2,balanced,2.071887969970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,2,power_law_1.01,0.2035072088241577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,1,power_law_1.2,27.274374389648436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,2,balanced,0.408463994661967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,2,power_law_1.01,0.3602688074111938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,2,balanced,2.09554131825765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,2,power_law_1.01,0.36426239013671874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,2,balanced,0.7180639902750651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,2,power_law_1.01,0.6842559814453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,2,power_law_1.01,0.2780416011810303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,2,balanced,2.1574880282084146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,2,balanced,1.3623894055684407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,2,power_law_1.01,0.4875328063964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,2,power_law_1.01,0.5448383808135986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,2,balanced,2.0053332646687827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,2,balanced,2.2026880582173667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,2,power_law_1.01,1.0017087936401368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,2,balanced,2.003647963205973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,1,power_law_1.2,54.6450439453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,2,power_law_1.01,0.8087743759155274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,2,balanced,9.402042388916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,2,power_law_1.01,1.45863037109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,2,balanced,2.299839973449707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,2,balanced,2.014570713043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,2,power_law_1.01,0.9353023529052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,2,power_law_1.01,1.8996160507202149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,2,balanced,2.0172853469848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,2,power_law_1.01,1.2437312126159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,2,balanced,2.343557357788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,2,power_law_1.01,2.3670976638793944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,2,balanced,2.0267200469970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,2,power_law_1.01,1.2960384368896485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,2,power_law_1.01,2.634867286682129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,2,balanced,2.034426689147949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,2,balanced,2.4966185887654624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,2,power_law_1.01,1.3575551986694336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,2,power_law_1.01,2.695577621459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,2,balanced,2.0462400118509927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,2,power_law_1.01,1.470355224609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,2,balanced,2.062101364135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,2,power_law_1.01,2.81014404296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,2,balanced,2.685509363810221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,2,power_law_1.01,1.4820992469787597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,2,balanced,2.089786688486735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,2,power_law_1.01,2.8868991851806642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,2,balanced,14.165140787760416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,2,power_law_1.01,1.5359487533569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,2,balanced,2.1066667238871255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,2,power_law_1.01,2.9525760650634765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,2,power_law_1.01,1.6959423065185546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,2,balanced,2.1546613375345864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,2,power_law_1.01,3.0930047988891602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,2,balanced,2.9333225886027017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,2,power_law_1.01,1.7857215881347657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,2,power_law_1.01,3.101049613952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,2,balanced,2.2653493881225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,2,power_law_1.01,1.8515840530395509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,2,power_law_1.01,3.312723159790039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,2,power_law_1.01,1.7743616104125977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,2,power_law_1.01,3.265516662597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,2,balanced,3.846991856892904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,2,power_law_1.01,2.040121650695801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,2,power_law_1.01,3.603424072265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,2,power_law_1.01,0.1807039976119995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,2,balanced,2.3556319872538247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,2,power_law_1.01,2.0666431427001952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,2,power_law_1.01,4.14637451171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,2,power_law_1.01,0.25427200794219973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,2,power_law_1.01,2.331839942932129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,2,power_law_1.01,0.41571841239929197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,2,power_law_1.01,4.986003112792969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,2,power_law_1.01,2.6402944564819335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,2,power_law_1.01,0.31893761157989503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,2,power_law_1.01,5.157676696777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,2,balanced,4.2857866287231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,2,power_law_1.01,3.2354366302490236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,2,power_law_1.01,0.5469888210296631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,2,balanced,18.37291208902995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,2,power_law_1.01,6.612985229492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,2,power_law_1.01,3.410726547241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,2,power_law_1.01,0.8163328170776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,2,power_law_1.01,5.766380691528321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,2,power_law_1.01,4.256806564331055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,2,balanced,2.5689759254455566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,2,power_law_1.01,1.0183296203613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,2,power_law_1.01,6.870368194580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,2,power_law_1.01,1.263424015045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,2,power_law_1.01,4.972768020629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,2,balanced,2.7431678771972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,2,power_law_1.01,1.327731227874756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,2,power_law_1.01,6.220614242553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,2,power_law_1.01,7.873548889160157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,2,power_law_1.01,1.4121408462524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,2,balanced,3.070255915323893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,2,balanced,5.928506851196289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,2,power_law_1.01,6.751046752929687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,2,power_law_1.01,9.816703796386719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,2,power_law_1.01,1.4717887878417968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,2,power_law_1.01,7.864921569824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,2,power_law_1.01,1.528108787536621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,2,balanced,3.6206932067871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,2,power_law_1.01,11.636863708496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,2,power_law_1.01,1.6478015899658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,2,power_law_1.01,12.505945587158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,2,power_law_1.01,1.7956480026245116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,2,power_law_1.01,14.002610778808593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,2,power_law_1.2,0.20275840759277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,2,balanced,4.200645446777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,2,power_law_1.01,1.8696319580078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,2,power_law_1.01,23.065574645996094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,2,power_law_1.01,21.03923797607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,2,power_law_1.01,1.9816896438598632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,2,power_law_1.2,0.36009600162506106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,2,power_law_1.01,2.244620704650879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,2,balanced,7.608858744303386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,2,power_law_1.2,0.3832000017166138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,2,power_law_1.01,2.7250879287719725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,2,balanced,6.549109141031901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,2,power_law_1.2,0.47571840286254885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,2,power_law_1.01,37.675558471679686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,2,power_law_1.2,0.861638355255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,2,power_law_1.01,2.6629247665405273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,2,power_law_1.2,1.3254783630371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,2,power_law_1.2,1.579263973236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,2,power_law_1.01,2.6463104248046876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,2,balanced,7.967749277750651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,2,power_law_1.2,2.302988815307617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,2,power_law_1.01,3.0618688583374025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,2,power_law_1.2,2.440447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,2,balanced,34.02086893717448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,2,power_law_1.01,4.021664047241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,2,power_law_1.2,2.5424192428588865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,2,power_law_1.01,4.202054214477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,2,power_law_1.2,2.640915107727051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,2,power_law_1.01,5.581292724609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,2,balanced,11.175360361735025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,2,power_law_1.2,2.7946239471435548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,2,power_law_1.01,6.837248229980469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,2,balanced,11.393973032633463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,2,power_law_1.2,2.8144319534301756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,2,power_law_1.01,10.11470718383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,2,power_law_1.2,2.9159872055053713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,2,power_law_1.2,3.1854143142700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,2,power_law_1.01,12.741433715820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,2,power_law_1.2,3.26429443359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,2,power_law_1.01,16.085530090332032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,2,power_law_1.2,3.39683837890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,2,power_law_1.2,3.7390720367431642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,2,power_law_1.01,24.377958679199217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,2,power_law_1.2,4.463315200805664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,2,balanced,15.067754109700521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,2,power_law_1.2,5.281401443481445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,2,power_law_1.2,5.523769760131836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,2,power_law_1.01,49.524575805664064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,2,power_law_1.2,6.751321411132812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,2,power_law_1.2,6.0797374725341795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,2,power_law_1.2,7.53465576171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,2,power_law_1.2,8.76635513305664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,2,power_law_1.2,10.677011108398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,2,balanced,23.569129943847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,2,power_law_1.2,12.790547180175782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,2,balanced,21.544390360514324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,2,power_law_1.2,0.1335039973258972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,2,power_law_1.2,14.889913940429688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,2,power_law_1.2,0.20353920459747316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,2,power_law_1.2,0.2329279899597168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,2,power_law_1.2,24.01136016845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,2,power_law_1.2,0.25150721073150634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,2,power_law_1.2,0.48056960105895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,2,power_law_1.2,0.6707776069641114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,2,power_law_1.2,39.8166015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,2,power_law_1.2,0.7971839904785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,2,power_law_1.2,1.1622015953063964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,2,power_law_1.2,1.267916774749756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,2,power_law_1.2,1.3202688217163085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,2,power_law_1.2,1.3599167823791505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,2,power_law_1.2,1.4547391891479493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,2,power_law_1.2,1.4712767601013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,2,power_law_1.2,1.6691776275634767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,2,power_law_1.2,1.8365375518798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,2,power_law_1.2,1.8715904235839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,2,power_law_1.2,1.8450944900512696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,2,power_law_1.2,2.081727981567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,2,power_law_1.2,2.1186752319335938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,2,power_law_1.2,2.505523109436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,2,balanced,46.59713236490885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,2,power_law_1.2,2.901113510131836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,2,power_law_1.2,3.413267135620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,2,power_law_1.2,3.608915328979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,2,power_law_1.2,4.288710403442383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,2,power_law_1.2,5.345798492431641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,2,power_law_1.2,6.982028961181641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,2,power_law_1.2,6.965663909912109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,1,balanced,0.136245330174764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,2,power_law_1.2,8.901363372802734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,1,balanced,0.20198933283487955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,1,balanced,0.36458667119344074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,2,power_law_1.2,13.049369812011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,1,balanced,0.6958026885986328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,2,power_law_1.2,0.18078080415725709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,1,balanced,1.3359626134236653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,2,power_law_1.2,0.2533951997756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,1,balanced,2.612943967183431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,1,balanced,0.09045867125193278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,2,power_law_1.2,23.934419250488283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,2,power_law_1.2,0.2747904062271118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,1,balanced,3.8839200337727866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,1,balanced,0.1266986628373464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,2,power_law_1.2,0.3049920082092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,1,balanced,3.9062185287475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,1,balanced,0.20878932873408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,2,power_law_1.2,0.46895360946655273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,1,balanced,3.910367965698242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,1,balanced,0.38143467903137207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,1,balanced,0.7173706690470377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,1,balanced,3.9130080540974936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,2,power_law_1.2,0.7253056049346924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,1,balanced,1.3776853879292805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,1,balanced,3.9533119201660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,2,power_law_1.2,0.853228759765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,1,balanced,2.0388693809509277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,2,power_law_1.2,1.2310463905334472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,1,balanced,3.9473066329956055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,1,balanced,2.0467947324117026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,2,power_law_1.2,1.2752767562866212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,1,balanced,3.97760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,1,balanced,2.052720069885254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,1,balanced,4.00328000386556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,2,power_law_1.2,1.3355968475341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,1,balanced,2.060357411702474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,1,balanced,4.008330663045247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,2,power_law_1.2,1.428384017944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,1,balanced,2.0560426712036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,1,balanced,2.069434642791748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,1,balanced,4.019445419311523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,2,power_law_1.2,1.5501824378967286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,1,balanced,2.0965332984924316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,1,balanced,4.085013389587402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,2,power_law_1.2,1.6191295623779296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,1,balanced,2.1328585942586265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,2,power_law_1.2,1.7930816650390624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,1,balanced,4.1434933344523115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,1,balanced,2.145594596862793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,2,power_law_1.2,1.9644224166870117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,1,balanced,2.1859520276387534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,1,balanced,4.297002792358398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,2,power_law_1.2,2.032934379577637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,1,balanced,2.1978294054667153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,1,balanced,4.440810521443685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,2,power_law_1.2,2.278425598144531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,1,balanced,2.2659786542256675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,2,power_law_1.2,2.816697692871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,1,balanced,4.5400800704956055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,1,balanced,2.2800532976786294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,1,balanced,2.399855931599935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,1,balanced,4.795370737711589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,2,power_law_1.2,2.7844863891601563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,1,balanced,2.5702826182047525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,1,balanced,5.124752044677734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,2,power_law_1.2,2.8201152801513674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,1,balanced,2.7957706451416016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,2,power_law_1.2,3.2402687072753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,1,balanced,0.1758400003115336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,2,power_law_1.2,4.253862380981445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,1,balanced,5.619269053141276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,1,balanced,3.0191148122151694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,1,balanced,0.20671466986338297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,1,power_law_1.01,0.13327360153198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,2,power_law_1.2,4.423078536987305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,1,balanced,0.2842186689376831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,1,power_law_1.01,0.20229120254516603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,1,balanced,0.4496106704076131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,2,power_law_1.2,5.817567825317383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,1,balanced,0.7457066377003988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,1,balanced,3.5170987447102866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,1,power_law_1.01,0.3611327886581421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,1,balanced,1.394015947977702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,1,balanced,6.799834569295247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,2,power_law_1.2,7.513394927978515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,1,power_law_1.01,0.47676801681518555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,1,balanced,2.046138604482015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,1,balanced,2.0465332667032876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,1,power_law_1.01,0.9736127853393555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,2,power_law_1.2,10.046604919433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,1,balanced,2.0545706748962402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,1,power_law_1.01,1.485203170776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,1,balanced,4.471295992533366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,1,balanced,2.0610292752583823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,2,power_law_1.2,12.984005737304688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,1,power_law_1.01,1.8063871383666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,1,balanced,2.0764853159586587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,1,balanced,7.751898447672526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,1,balanced,2.1022772789001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,1,power_law_1.01,2.3647039413452147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,2,power_law_1.2,17.032255554199217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,1,balanced,2.1131466229756675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,1,power_law_1.01,2.5496063232421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,1,balanced,2.151637395222982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,1,power_law_1.01,0.09071999788284302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,1,power_law_1.01,2.630361557006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,1,balanced,2.20142396291097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,1,balanced,5.329600016276042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,2,power_law_1.2,25.386936950683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,1,power_law_1.01,0.12581119537353516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,1,balanced,2.2395092646280923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,1,power_law_1.01,2.7472000122070312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,1,power_law_1.01,0.20437119007110596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,1,balanced,2.320469379425049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,1,power_law_1.01,0.26356480121612547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,1,power_law_1.01,2.9219072341918944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,1,power_law_1.01,0.5268735885620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,1,balanced,2.478117307027181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,1,power_law_1.01,2.950271987915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,1,balanced,10.500282923380533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,1,power_law_1.01,0.7822847843170166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,1,power_law_1.01,0.9164159774780274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,2,power_law_1.2,49.41455993652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,1,power_law_1.01,3.0432832717895506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,1,power_law_1.01,1.244979190826416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,1,power_law_1.01,1.2971263885498048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,1,power_law_1.01,3.150124740600586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,1,power_law_1.01,1.3483967781066895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,1,balanced,7.27461306254069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,1,balanced,2.6835734049479165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,1,power_law_1.01,3.2306175231933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,1,power_law_1.01,1.4710783958435059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,1,power_law_1.01,1.4928576469421386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,1,power_law_1.01,3.381932830810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,1,power_law_1.01,1.5501824378967286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,1,power_law_1.01,3.822022247314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,1,power_law_1.01,1.6180736541748046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,1,power_law_1.01,1.660927963256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,1,power_law_1.01,4.518815994262695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,1,balanced,13.598709106445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,1,power_law_1.01,1.7188543319702148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,1,power_law_1.01,1.7619903564453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,1,power_law_1.01,5.440063858032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,1,balanced,3.059839884440104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,1,power_law_1.01,1.9373056411743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,1,power_law_1.01,2.3650432586669923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,1,power_law_1.01,5.055020904541015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,1,balanced,3.352693239847819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,1,power_law_1.01,2.921446418762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,1,balanced,9.271674474080404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,1,power_law_1.01,6.131859207153321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,1,power_law_1.01,0.17481600046157836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,1,power_law_1.01,2.7283647537231444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,1,power_law_1.01,0.21422719955444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,1,power_law_1.01,5.459328079223633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,1,power_law_1.01,3.387955093383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,1,balanced,3.8338292439778647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,1,power_law_1.01,0.29392640590667723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,1,power_law_1.01,3.1411903381347654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,1,power_law_1.01,6.775218963623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,1,power_law_1.01,0.3264960050582886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,1,power_law_1.01,3.8956863403320314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,1,balanced,4.813653310139974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,1,power_law_1.01,0.5612031936645507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,1,power_law_1.01,5.120774459838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,1,power_law_1.01,8.711353302001953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,1,power_law_1.01,0.8193728446960449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,1,power_law_1.01,6.626335906982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,1,power_law_1.01,0.964345645904541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,1,power_law_1.01,10.88055648803711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,1,power_law_1.01,1.2809344291687013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,1,power_law_1.01,7.933074951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,1,balanced,5.889578501383464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,1,power_law_1.01,1.3323007583618165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,1,power_law_1.01,12.310214233398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,1,balanced,19.972405751546223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,1,power_law_1.01,9.500556945800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,1,power_law_1.01,1.423699188232422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,1,power_law_1.01,14.831590270996093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,1,power_law_1.01,14.712460327148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,1,power_law_1.01,1.4940287590026855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,1,power_law_1.01,1.556383991241455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,1,balanced,9.082346598307291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,1,power_law_1.01,1.6587520599365235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,1,balanced,13.876229604085287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,1,power_law_1.01,21.946989440917967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,1,power_law_1.01,29.652801513671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,1,power_law_1.01,1.8190847396850587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,1,power_law_1.01,1.9734336853027343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,1,power_law_1.01,2.055891227722168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,1,power_law_1.01,2.3458560943603515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,1,power_law_1.01,43.2653564453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,1,balanced,11.48794682820638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,1,power_law_1.2,0.13327360153198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,1,power_law_1.01,2.8650880813598634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,1,power_law_1.2,0.20330240726470947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,1,power_law_1.2,0.2716671943664551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.01,3.013088035583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,1,power_law_1.2,0.47829761505126955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,1,power_law_1.2,0.8115263938903808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.01,3.0724159240722657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,1,power_law_1.2,1.2804224014282226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,1,balanced,16.05946095784505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.01,3.609772872924805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,1,power_law_1.2,1.5112000465393067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.01,4.683225631713867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,1,power_law_1.2,2.188857650756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.01,5.223283386230468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,1,power_law_1.2,2.425350379943848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.01,7.036294555664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,1,power_law_1.2,2.476947212219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,1,power_law_1.2,2.699123191833496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.01,8.803858947753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,1,power_law_1.2,2.8255807876586916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,1,power_law_1.2,2.9671424865722655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.01,12.454694366455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,1,balanced,20.9682133992513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,1,balanced,39.58293914794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,1,power_law_1.2,3.011929512023926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.01,16.109068298339842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,1,power_law_1.2,3.126790428161621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,1,power_law_1.2,3.2613887786865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,1,power_law_1.01,19.826329040527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,1,balanced,27.270960489908855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,1,power_law_1.2,3.5036224365234374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,1,power_law_1.2,3.849363327026367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,1,power_law_1.01,31.188204956054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,1,power_law_1.2,4.731801605224609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,1,power_law_1.2,5.571718215942383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,1,power_law_1.2,5.361785507202148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,1,power_law_1.01,61.2527587890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,1,power_law_1.2,6.420864105224609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,1,balanced,32.35040537516276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,1,power_law_1.2,5.8008575439453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,1,power_law_1.2,6.915737915039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,1,power_law_1.2,9.258521270751952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,1,power_law_1.2,11.535052490234374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,1,power_law_1.2,12.951686096191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,1,power_law_1.2,15.367059326171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,1,power_law_1.2,0.0895359992980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,1,power_law_1.2,0.12577279806137084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,1,power_law_1.2,22.668800354003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,1,power_law_1.2,0.15488640069961548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,1,power_law_1.2,0.26872959136962893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,1,power_law_1.2,0.44481282234191893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,1,power_law_1.2,0.6772543907165527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,1,power_law_1.2,0.7839488029479981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,1,power_law_1.2,42.79021301269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,1,power_law_1.2,1.1507840156555176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,1,power_law_1.2,1.219264030456543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,1,power_law_1.2,1.3240511894226075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,1,power_law_1.2,1.3933376312255858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,1,power_law_1.2,1.4595904350280762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,1,power_law_1.2,1.5116543769836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,1,power_law_1.2,1.6116544723510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,1,power_law_1.2,1.6086912155151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,1,power_law_1.2,1.7221759796142577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,1,power_law_1.2,1.823788833618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,1,balanced,64.29201761881511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,1,power_law_1.2,1.974470329284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,1,power_law_1.2,2.446579170227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,1,power_law_1.2,3.0127231597900392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,1,power_law_1.2,2.9411264419555665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,1,power_law_1.2,3.6060417175292967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,1,power_law_1.2,3.374470520019531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,1,power_law_1.2,4.173356628417968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,1,power_law_1.2,5.381267166137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,1,power_law_1.2,6.928076934814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,1,power_law_1.2,8.253343963623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,2,balanced,0.07162666817506154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,1,power_law_1.2,9.821913909912109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,2,balanced,0.08868267138799031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,1,power_law_1.2,15.129971313476563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,1,power_law_1.2,0.17488640546798706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,1,power_law_1.2,0.21324799060821534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,1,power_law_1.2,0.2522304058074951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,2,balanced,0.10765332976977031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,1,power_law_1.2,29.458746337890624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,1,power_law_1.2,0.3365247964859009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,1,power_law_1.2,0.5181759834289551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,1,power_law_1.2,0.7280255794525147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,2,balanced,0.11795733372370402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,1,power_law_1.2,0.8754431724548339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,2,power_law_1.01,0.10282880067825317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,1,power_law_1.2,1.2315711975097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,2,power_law_1.01,0.126636803150177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,1,power_law_1.2,1.2862784385681152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,2,balanced,0.17997332413991293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,2,power_law_1.01,0.11734399795532227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,1,power_law_1.2,1.3362175941467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,2,power_law_1.01,0.09967359900474548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,1,power_law_1.2,1.4442048072814941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,2,power_law_1.01,0.14473600387573243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,2,balanced,0.3171093265215556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,1,power_law_1.2,1.546412754058838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,2,power_law_1.01,0.15777920484542846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,2,power_law_1.2,0.10200320482254029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,2,balanced,0.31994134187698364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,2,power_law_1.01,0.23457279205322265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,1,power_law_1.2,1.658188819885254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,2,balanced,0.31921066840489704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,2,power_law_1.2,0.12777600288391114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,2,power_law_1.01,0.2396928071975708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,1,power_law_1.2,1.7851648330688477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,2,balanced,0.3190613389015198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,2,power_law_1.2,0.10574719905853272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,2,power_law_1.01,0.2551039934158325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,2,balanced,0.31947733958562213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,1,power_law_1.2,1.9545343399047852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,2,power_law_1.2,0.10738559961318969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,2,power_law_1.01,0.25992960929870607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,2,balanced,0.32100266218185425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,1,power_law_1.2,2.0782144546508787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,2,power_law_1.2,0.13782399892807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,2,balanced,0.3204266627629598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,2,power_law_1.01,0.2694591999053955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,2,power_law_1.2,0.1664639949798584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,1,power_law_1.2,2.359052848815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,2,balanced,0.32128532727559406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,2,power_law_1.01,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,2,power_law_1.2,0.2288383960723877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,1,power_law_1.2,2.8825536727905274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,2,balanced,0.3219573299090068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,2,power_law_1.01,0.3123647928237915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,2,power_law_1.2,0.251910400390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,1,balanced,0.06940799951553345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,2,power_law_1.01,0.34408960342407224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,2,power_law_1.2,0.2452608108520508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.2,3.020512008666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,2,power_law_1.2,0.27552640438079834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,1,balanced,0.08685333530108134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,2,power_law_1.2,0.29986560344696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,2,balanced,0.3727840185165405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,2,power_law_1.01,0.37372798919677735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,2,power_law_1.2,0.3065407991409302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,2,balanced,0.37379733721415204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,2,power_law_1.01,0.38726398944854734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.2,3.207001495361328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,1,balanced,0.1157973309357961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,2,balanced,0.3752959966659546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,2,power_law_1.2,0.3132607936859131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,2,power_law_1.01,0.42529921531677245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.2,3.740371322631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,1,balanced,0.1413386662801107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,2,power_law_1.2,0.3883455991744995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,1,balanced,0.18086934089660645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.2,4.798828887939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,2,power_law_1.2,0.38449280261993407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,1,balanced,0.3285706639289856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,2,power_law_1.2,0.40780158042907716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.2,5.433811187744141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,1,balanced,0.33058667182922363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,2,balanced,0.49929598967234295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,2,power_law_1.2,0.44971518516540526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,2,power_law_1.01,0.5565887928009033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.2,7.173312377929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,1,power_law_1.01,0.06851840019226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,1,balanced,0.33082133531570435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,2,power_law_1.01,0.6155072212219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,2,power_law_1.2,0.5792640209197998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,2,balanced,0.5040906667709351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,1,power_law_1.01,0.08596479892730713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,1,balanced,0.33183467388153076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.2,8.990611267089843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,2,power_law_1.2,0.6693888187408448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,2,power_law_1.01,1.174015998840332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,2,balanced,1.0252479712168376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,1,power_law_1.01,0.09754239916801452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,1,balanced,0.33188800017038983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,2,power_law_1.2,1.2632320404052735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,2,power_law_1.01,1.3479743957519532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,2,balanced,1.0336000124613445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,1,power_law_1.01,0.12501120567321777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.2,12.677375793457031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,1,balanced,0.3317813277244568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,2,power_law_1.2,1.452000045776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,2,power_law_1.01,1.5781375885009765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,1,power_law_1.01,0.12628480195999145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,2,balanced,1.064090649286906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,1,balanced,0.33259199062983197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,2,power_law_1.2,1.667795181274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,2,power_law_1.01,1.9541376113891602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.2,16.173440551757814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,1,power_law_1.01,0.16778240203857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,1,balanced,0.33235732714335126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,2,power_law_1.2,1.9964672088623048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,2,power_law_1.01,2.400588798522949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,2,balanced,1.0840906302134197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,1,power_law_1.01,0.2280832052230835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,1,balanced,0.3344586690266927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,2,power_law_1.2,2.8170623779296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,2,power_law_1.01,2.9876352310180665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,1,power_law_1.2,19.774847412109374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,1,power_law_1.01,0.24926719665527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,1,balanced,0.3358773390452067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,2,balanced,2.0598665873209634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,1,power_law_1.01,0.2560447931289673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,2,power_law_1.2,3.307167816162109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,2,power_law_1.01,4.131603240966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,1,balanced,0.3370453516642253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,1,power_law_1.01,0.26831998825073244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,1,balanced,0.3387840191523234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,2,power_law_1.2,4.482470321655273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,2,power_law_1.01,5.556006240844726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,1,power_law_1.2,30.859115600585938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,1,power_law_1.01,0.27164158821105955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,2,balanced,2.109557310740153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,1,balanced,0.4004053274790446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,2,power_law_1.2,5.783903884887695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,2,power_law_1.01,6.7655998229980465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,1,power_law_1.01,0.29295361042022705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,1,balanced,0.4039253393809001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,2,power_law_1.2,6.706566619873047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,1,power_law_1.01,0.3113343954086304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,2,power_law_1.01,10.327251434326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,1,power_law_1.2,0.06934400200843811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,1,balanced,0.5428320169448853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,2,balanced,3.120527903238932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,1,power_law_1.01,0.3526463985443115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,2,power_law_1.2,11.062655639648437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,1,power_law_1.2,0.085971200466156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,1,power_law_1.2,60.41748046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,1,balanced,0.5536160071690878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,1,power_law_1.01,0.38913280963897706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,2,power_law_1.01,19.70665588378906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,1,power_law_1.2,0.09253119826316833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,1,power_law_1.01,0.4158912181854248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,1,balanced,1.136895974477132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,2,power_law_1.2,18.873011779785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,1,power_law_1.2,0.11898239850997924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,1,power_law_1.01,0.5003903865814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,2,balanced,4.152880032857259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,1,power_law_1.2,0.12298879623413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,1,balanced,1.1627093156178792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,1,power_law_1.01,0.5195712089538574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,1,power_law_1.2,0.15151360034942626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,1,power_law_1.01,0.6050367832183838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,1,power_law_1.2,0.2256704092025757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,1,balanced,2.1954612731933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,1,power_law_1.01,0.7276864051818848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,1,power_law_1.2,0.23861119747161866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,1,power_law_1.01,0.8533632278442382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,1,power_law_1.2,0.2508863925933838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,2,balanced,5.162554740905762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,1,balanced,2.2504213651021323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,1,power_law_1.01,1.6105728149414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,1,power_law_1.2,0.26363520622253417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,1,power_law_1.01,1.901375961303711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,1,power_law_1.2,0.28954880237579345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,1,power_law_1.01,2.420774459838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,1,power_law_1.2,0.3105151891708374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,1,balanced,3.3321708043416343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,1,power_law_1.2,0.31870720386505125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,1,power_law_1.01,2.9827648162841798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,1,power_law_1.2,0.36414079666137694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,1,power_law_1.01,4.062137603759766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,1,power_law_1.2,0.40190720558166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,2,balanced,8.225658416748047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,1,power_law_1.01,5.132588958740234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,1,power_law_1.2,0.44479999542236326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,1,power_law_1.2,0.520959997177124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,1,balanced,4.432714780171712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,1,power_law_1.01,6.247814559936524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,1,power_law_1.2,0.5354688167572021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,1,power_law_1.01,9.498880004882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,1,power_law_1.2,0.6298687934875489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,2,balanced,0.07077866792678833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,1,power_law_1.2,0.7742271900177002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,1,power_law_1.01,18.480921936035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,1,power_law_1.2,0.8997504234313964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,2,balanced,0.08884800473848979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,1,balanced,5.5213063557942705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,1,power_law_1.2,1.6670848846435546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,1,power_law_1.2,1.957472038269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,2,balanced,0.10589866836865743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,1,power_law_1.2,2.522598457336426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,1,power_law_1.2,3.045894432067871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,1,power_law_1.2,4.155654525756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,2,balanced,0.11623467008272807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,2,balanced,16.58032480875651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,1,power_law_1.2,5.240326309204102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,1,balanced,8.80022939046224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,1,power_law_1.2,6.259961700439453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,2,balanced,0.10730133454004924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,2,balanced,0.11505599816640218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,1,power_law_1.2,9.512268829345704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,2,balanced,0.11577066779136658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,2,balanced,0.11540800333023071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,1,power_law_1.2,18.453369140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,2,balanced,0.12083733081817627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,2,balanced,0.1209333340326945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,2,balanced,0.121370663245519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,2,balanced,0.1607253352801005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,1,balanced,17.78528594970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,2,balanced,0.15967999895413718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,2,balanced,0.16090133786201477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,2,balanced,0.28730666637420654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,2,balanced,0.28787734111150104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,2,balanced,0.2905600070953369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,2,balanced,0.2930399974187215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,2,balanced,0.29687466224034625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,2,balanced,0.5525013208389282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,2,balanced,0.5592853228251139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,2,balanced,0.8149440288543701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,2,balanced,1.0726880232493083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,2,balanced,1.5878933270772297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,2,balanced,2.1113120714823403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,2,power_law_1.01,0.09279999732971192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,2,balanced,3.1173388163248696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,2,power_law_1.01,0.10126719474792481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,2,power_law_1.01,0.10835839509963989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,2,power_law_1.01,0.09383040070533752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,2,power_law_1.01,0.10521600246429444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,2,balanced,4.151717185974121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,2,power_law_1.01,0.11214079856872558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,2,power_law_1.01,0.12163840532302857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,2,power_law_1.01,0.1277184009552002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,2,power_law_1.01,0.1365056037902832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,2,balanced,5.167861302693685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,2,power_law_1.01,0.1301632046699524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,2,power_law_1.2,0.0905023992061615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,2,power_law_1.01,0.14888319969177247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,1,balanced,0.06869333485762279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,2,power_law_1.2,0.0937279999256134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,2,power_law_1.01,0.1746880054473877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,2,power_law_1.2,0.10817919969558716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,2,power_law_1.01,0.1769152045249939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,2,power_law_1.2,0.09531520009040832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,1,balanced,0.08585066596666972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,2,power_law_1.01,0.19496320486068724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,2,power_law_1.2,0.10392320156097412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,2,power_law_1.01,0.3403007984161377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,2,power_law_1.2,0.11531519889831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,2,balanced,8.259312311808268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,2,power_law_1.01,0.3505664110183716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,2,power_law_1.2,0.1223423957824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,1,balanced,0.1122826635837555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,2,power_law_1.01,0.3976639986038208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,2,power_law_1.2,0.1270591974258423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,1,balanced,0.13939733306566873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,2,power_law_1.01,0.4443967819213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,2,power_law_1.2,0.14097280502319337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,1,balanced,0.10386133193969727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,1,balanced,0.10379200180371602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,2,power_law_1.2,0.13925119638442993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,2,power_law_1.01,0.5310976028442382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,1,power_law_1.01,0.06647679805755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,2,power_law_1.2,0.14710400104522706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,1,balanced,0.10486933588981628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,2,power_law_1.01,0.7100992202758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,1,power_law_1.01,0.07715200185775757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,1,balanced,0.10457600156466167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,2,power_law_1.2,0.17541120052337647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,2,power_law_1.01,0.7796544075012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,1,power_law_1.01,0.09708799719810486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,1,balanced,0.10494400064150493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,1,power_law_1.01,0.09304959774017334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,2,power_law_1.2,0.18506239652633666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,2,power_law_1.01,1.1204607963562012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,1,power_law_1.01,0.10218240022659301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,1,balanced,0.1051680048306783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,2,power_law_1.2,0.19426560401916504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,1,power_law_1.01,0.10305919647216796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,2,power_law_1.01,1.5826944351196288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,1,balanced,0.1048426628112793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,1,power_law_1.01,0.11335680484771729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,2,power_law_1.2,0.35342719554901125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,2,power_law_1.01,2.106169509887695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,1,power_law_1.01,0.12039040327072144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,1,balanced,0.1188159982363383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,2,power_law_1.2,0.35893759727478025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,1,power_law_1.01,0.12952959537506104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,2,power_law_1.01,2.9481855392456056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,1,balanced,0.11931199828783672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,2,power_law_1.2,0.379532790184021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,1,power_law_1.01,0.1340288043022156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,1,power_law_1.01,0.15294719934463502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,1,balanced,0.1202186644077301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,2,power_law_1.01,4.302451324462891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,2,power_law_1.2,0.47735037803649905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,1,power_law_1.01,0.14703359603881835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,2,balanced,16.476795196533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,1,power_law_1.2,0.06654719710350036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,1,balanced,0.15028267105420431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,2,power_law_1.2,0.5818880081176758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,1,power_law_1.01,0.15726079940795898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,2,power_law_1.01,5.622476959228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,1,power_law_1.01,0.17526400089263916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,1,balanced,0.15161066253980002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,1,power_law_1.2,0.07559040188789368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,2,power_law_1.2,0.6826240062713623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,1,power_law_1.01,0.20083839893341066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,2,power_law_1.01,6.353132629394532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,1,balanced,0.15405866503715515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,1,power_law_1.2,0.08613759875297547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,2,power_law_1.2,0.8543744087219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,1,power_law_1.01,0.22065279483795167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,1,balanced,0.3055093288421631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,1,power_law_1.2,0.08213120102882385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,2,power_law_1.2,1.2551424026489257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,2,power_law_1.01,10.680678558349609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,1,power_law_1.01,0.2423935890197754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,1,power_law_1.2,0.10243200063705445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,2,power_law_1.2,1.4557439804077148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,1,balanced,0.3106773296991984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,1,power_law_1.01,0.4475071907043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,4,balanced,0.1411946713924408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,1,power_law_1.2,0.10474239587783814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,1,power_law_1.01,0.4963071823120117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,2,power_law_1.2,2.1984384536743162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,1,balanced,0.5786346594492594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,2,power_law_1.01,23.631724548339843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,1,power_law_1.01,0.6306303977966309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,4,balanced,0.11681600411732991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,1,power_law_1.2,0.11634559631347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,2,power_law_1.2,3.2477886199951174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,1,balanced,0.5898880163828532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,1,power_law_1.01,0.7690303802490235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,4,balanced,0.18869332472483316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,1,power_law_1.2,0.12268160581588745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,1,power_law_1.01,1.0376319885253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,2,power_law_1.2,3.7996864318847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,4,balanced,0.18872000773747763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,1,power_law_1.2,0.12995200157165526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,1,balanced,0.8698933124542236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,1,power_law_1.01,1.3063551902770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,4,balanced,0.19056532780329385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,1,power_law_1.2,0.14030719995498658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,2,power_law_1.2,5.60302734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,4,balanced,0.19041067361831665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,1,power_law_1.01,1.8550975799560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,1,balanced,1.1489653587341309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,1,power_law_1.2,0.1534719944000244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,4,balanced,0.1923840045928955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,2,power_law_1.2,7.479052734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,1,power_law_1.01,2.4144704818725584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,4,balanced,0.0881119966506958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,1,power_law_1.2,0.1491968035697937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,4,balanced,0.19369600216547647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,1,power_law_1.01,3.4922367095947267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,1,balanced,1.692911942799886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,4,balanced,0.0839466651280721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,2,power_law_1.2,11.031513977050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,1,power_law_1.2,0.16173440217971802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,4,balanced,0.20076799392700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,1,power_law_1.01,4.58587532043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,4,balanced,0.12334932883580525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,4,balanced,0.20344533522923788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,1,power_law_1.01,5.693779373168946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,1,power_law_1.2,0.17845760583877562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,4,balanced,0.12007466952006023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,1,balanced,2.2431413332621255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,4,balanced,0.21369065841039023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,1,power_law_1.2,0.20799999237060546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,1,power_law_1.01,8.970336151123046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,2,power_law_1.2,24.84685363769531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,4,balanced,0.12096533179283142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,4,balanced,0.2172373334566752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,1,power_law_1.2,0.22278399467468263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,4,balanced,0.12131733695665996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,4,balanced,0.21967999140421549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,1,power_law_1.2,0.25489280223846433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,1,power_law_1.01,17.69233856201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,4,balanced,0.12250666817029317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,4,balanced,0.22349333763122559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,1,balanced,3.3320639928181968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,1,power_law_1.2,0.4443903923034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,4,balanced,0.12473066647847493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,4,balanced,0.24636266628901163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,1,power_law_1.2,0.522976016998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,4,balanced,0.12603200475374857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,4,balanced,0.2467306653658549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,1,power_law_1.2,0.6359615802764893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,4,balanced,0.1254026691118876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,4,balanced,0.24566932519276938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,1,power_law_1.2,0.7823232173919678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,4,balanced,0.13275733590126038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,1,balanced,4.431578636169434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,4,balanced,0.3404426574707031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,4,balanced,0.13108799854914346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,1,power_law_1.2,1.0503552436828614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,4,balanced,0.13293332854906717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,4,balanced,0.3531999985376994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,1,power_law_1.2,1.309715175628662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,4,balanced,0.13110933701197305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,4,balanced,0.5092053413391113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,1,power_law_1.2,1.8520000457763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,4,balanced,0.1591253379980723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,4,balanced,0.5581386486689249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,1,power_law_1.2,2.405708885192871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,4,balanced,0.15933866302172342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,1,balanced,5.525994618733724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,4,balanced,0.1558080017566681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,4,balanced,0.7962133089701334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,1,power_law_1.2,3.5075710296630858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,4,balanced,0.208624005317688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,4,balanced,0.9918986956278483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,1,power_law_1.2,4.568544006347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,4,balanced,0.22630399465560913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,1,power_law_1.2,5.648396682739258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,4,balanced,1.4350719451904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,4,balanced,0.28217599789301556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,1,power_law_1.2,8.94579849243164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,4,balanced,0.3169333338737488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,4,balanced,1.7984426816304524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,4,balanced,0.47013334433237713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,1,balanced,8.817850748697916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,1,power_law_1.2,17.728504943847657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,4,balanced,2.645146687825521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,4,balanced,0.5798879861831665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,4,balanced,0.8459786574045817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,4,balanced,3.563824017842611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,4,balanced,1.1682933171590169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,4,balanced,4.371466636657715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,4,balanced,1.699728012084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,4,balanced,2.2353386878967285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,4,balanced,7.3046080271403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,4,balanced,2.7532641092936196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,1,balanced,17.741104125976562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,4,balanced,4.499429384867351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,4,balanced,14.8210080464681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,4,balanced,8.668261210123697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,4,power_law_1.01,0.21700479984283447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,4,power_law_1.01,0.14368000030517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,4,balanced,0.07434666653474171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,4,power_law_1.01,0.1579967975616455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,4,power_law_1.01,0.18853119611740113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,4,balanced,0.07396799822648366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,4,balanced,0.11416533589363098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,4,power_law_1.01,0.1911936044692993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,4,balanced,0.1172320048014323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,4,power_law_1.01,0.20556800365447997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,4,balanced,0.11801600456237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,4,power_law_1.01,0.24072320461273194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,4,balanced,0.11924800276756287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,4,power_law_1.01,0.21434240341186522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,4,balanced,0.12122133374214172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,4,power_law_1.01,0.22829439640045165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,4,balanced,0.12056000034014384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,4,power_law_1.01,0.25496959686279297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,4,power_law_1.01,0.2689728021621704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,4,power_law_1.01,0.3283776044845581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,4,balanced,0.13179733355840048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,4,power_law_1.01,0.3207040071487427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,4,balanced,0.13191999991734824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,4,power_law_1.01,0.2839807987213135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,4,power_law_1.01,0.32832000255584715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,4,power_law_1.01,0.10705920457839965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,4,power_law_1.01,0.39723520278930663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,4,power_law_1.01,0.08829439878463745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,4,power_law_1.01,0.46273279190063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,4,power_law_1.01,0.08848000168800355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,4,power_law_1.01,0.6179711818695068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,4,power_law_1.01,0.11923199892044067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,4,power_law_1.01,0.09717760086059571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,4,balanced,0.12702932953834534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,4,power_law_1.01,0.7946559906005859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,4,power_law_1.01,0.12041599750518799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,4,power_law_1.01,0.09778559803962708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,4,balanced,0.12938666343688965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,4,power_law_1.01,1.1386816024780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,4,power_law_1.01,0.1304703950881958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,4,power_law_1.01,0.09768959879875183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,4,balanced,0.13295466701189676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,4,power_law_1.01,1.2247488021850585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,4,power_law_1.01,0.1362239956855774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,4,power_law_1.01,0.11751680374145508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,4,balanced,0.13386666774749756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,4,power_law_1.01,1.9766271591186524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,4,power_law_1.01,0.1360576033592224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,4,power_law_1.01,0.11804159879684448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,4,power_law_1.01,3.0131647109985353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,4,power_law_1.01,0.1478592038154602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,4,power_law_1.01,0.13063679933547973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,4,power_law_1.01,0.14730240106582643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,4,power_law_1.01,0.14991999864578248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,4,power_law_1.01,3.4469505310058595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,4,power_law_1.01,0.14572160243988036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,4,power_law_1.01,0.16287360191345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,4,power_law_1.2,0.1842687964439392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,4,power_law_1.01,4.363302230834961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,4,power_law_1.01,0.15966720581054689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,4,balanced,0.1488640010356903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,4,power_law_1.2,0.18619519472122192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,4,power_law_1.01,0.15548800230026244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,4,power_law_1.01,7.452838134765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,4,power_law_1.2,0.15752960443496705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,4,power_law_1.01,0.19051519632339478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,4,balanced,0.15314132968584696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,4,power_law_1.2,0.18780800104141235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,4,power_law_1.01,0.1719231963157654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,4,power_law_1.01,0.19315199851989745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,4,balanced,0.15818132956822714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,4,power_law_1.01,6.477881622314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,4,power_law_1.2,0.19052799940109252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,4,power_law_1.2,0.203603196144104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,4,power_law_1.01,0.2621056079864502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,4,balanced,0.22084800402323404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,4,power_law_1.2,0.2511744022369385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,4,power_law_1.01,0.27467520236968995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,4,balanced,0.2344640096028646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,4,power_law_1.01,14.22144012451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,4,power_law_1.01,0.15924479961395263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,4,power_law_1.2,0.2165247917175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,4,power_law_1.2,0.23267199993133544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,4,power_law_1.01,0.2573823928833008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,4,power_law_1.01,0.17790720462799073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,4,power_law_1.2,0.2703295946121216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,4,power_law_1.01,0.3221695899963379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,4,power_law_1.01,18.361235046386717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,4,power_law_1.01,0.18881920576095582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,4,power_law_1.2,0.2809983968734741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,4,power_law_1.2,0.4046463966369629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,4,power_law_1.01,0.39470078945159914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,4,power_law_1.01,0.2414400100708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,4,power_law_1.2,0.39774720668792723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,4,power_law_1.01,0.5220608234405517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,4,power_law_1.2,0.3090303897857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,4,power_law_1.2,0.3662976026535034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,4,power_law_1.01,0.7135039806365967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,4,power_law_1.01,38.79056091308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,4,power_law_1.01,0.22560639381408693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,4,power_law_1.2,0.4067967891693115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,4,balanced,0.3508319854736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,4,power_law_1.01,1.344159984588623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,4,power_law_1.2,0.45255041122436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,4,power_law_1.01,0.2990976095199585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,4,power_law_1.2,0.48888320922851564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,4,power_law_1.01,1.4656255722045899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,4,balanced,0.44547200202941895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,4,power_law_1.2,0.7746751785278321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,4,power_law_1.01,0.33966081142425536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,4,power_law_1.01,1.974086380004883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,4,power_law_1.2,1.152556800842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,4,balanced,0.6737866401672363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,4,power_law_1.01,0.48599681854248045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,4,power_law_1.2,0.12403199672698975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,4,power_law_1.2,1.34202241897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,4,power_law_1.01,2.759449577331543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,4,power_law_1.01,0.5406911849975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,4,balanced,0.8906026681264242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,4,power_law_1.2,2.1625919342041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,4,power_law_1.2,0.11429120302200317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,4,power_law_1.2,2.658188819885254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,4,power_law_1.01,3.685843276977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,4,balanced,1.3329599698384602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,4,power_law_1.2,0.12142080068588257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,4,power_law_1.2,4.256806564331055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,4,power_law_1.01,5.380851364135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,4,power_law_1.2,0.11155840158462524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,4,power_law_1.01,0.7709504127502441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,4,power_law_1.2,6.041785430908203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,4,balanced,1.77675199508667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,4,power_law_1.01,1.1310848236083983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,4,power_law_1.2,7.084754943847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,4,power_law_1.01,7.743981170654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,4,power_law_1.2,0.12065919637680053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,4,power_law_1.01,1.8872640609741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,4,power_law_1.2,9.959366607666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,4,power_law_1.2,0.12375680208206177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,4,balanced,2.6533279418945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,4,power_law_1.01,11.954771423339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,4,power_law_1.01,2.438559913635254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,4,power_law_1.2,0.13919999599456787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,4,power_law_1.2,14.409356689453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,4,power_law_1.01,3.212192153930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,4,power_law_1.2,0.13916800022125245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,4,power_law_1.01,23.250022888183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,4,balanced,3.529722531636556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,4,power_law_1.2,0.09721599817276001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,4,power_law_1.2,0.145414400100708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,4,power_law_1.01,4.018156814575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,4,power_law_1.2,23.891865539550782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,4,power_law_1.2,0.11338880062103271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,4,power_law_1.2,0.15367679595947265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,4,power_law_1.01,7.1797630310058596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,4,power_law_1.2,0.10586240291595458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,4,power_law_1.2,0.14690560102462769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,4,balanced,4.404533386230469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,4,power_law_1.2,0.11662080287933349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,4,power_law_1.2,0.16953599452972412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,4,power_law_1.01,10.953485107421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,2,balanced,0.08226666847864787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,4,power_law_1.2,43.18004455566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,4,power_law_1.2,0.11801600456237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,4,power_law_1.2,0.1637760043144226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,2,balanced,0.10466667016347249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,4,power_law_1.01,12.317247772216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,4,power_law_1.2,0.13460479974746703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,4,power_law_1.2,0.21799681186676026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,2,balanced,0.18572266896565756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,4,power_law_1.2,0.1416383981704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,4,balanced,7.059263865152995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,4,power_law_1.2,0.26319360733032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,2,balanced,0.1895093321800232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,4,power_law_1.2,0.16808320283889772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,4,power_law_1.01,23.98070373535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,4,power_law_1.2,0.2658623933792114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,2,balanced,0.18941332896550497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,2,balanced,0.1911840041478475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,4,power_law_1.2,0.2635711908340454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,4,power_law_1.2,0.1663424015045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,2,balanced,0.19209599494934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,4,power_law_1.2,0.17496960163116454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,4,power_law_1.2,0.32892160415649413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,2,balanced,0.1928106745084127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,4,power_law_1.01,46.60599060058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,4,power_law_1.2,0.43128318786621095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,2,balanced,0.20187199115753174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,2,balanced,0.20054932435353598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,4,power_law_1.2,0.6159679889678955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,4,power_law_1.2,0.1618175983428955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,2,balanced,0.20535467068354288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,4,power_law_1.2,0.7742080211639404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,4,balanced,14.25069808959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,4,power_law_1.2,0.17397119998931884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,2,balanced,0.2132533391316732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,4,power_law_1.2,1.1473024368286133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,4,power_law_1.2,0.1966655969619751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,2,balanced,0.2158613403638204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,4,power_law_1.2,1.5240896224975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,4,power_law_1.2,0.2169856071472168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,2,balanced,0.22645866870880127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,4,power_law_1.2,1.9902847290039063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,2,balanced,0.22672533988952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,4,power_law_1.2,3.327417755126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,4,power_law_1.2,0.24355199337005615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,2,balanced,0.22684266169865927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,4,power_law_1.2,3.9857406616210938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,4,power_law_1.2,0.2563391923904419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,2,balanced,0.24445867538452148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,4,power_law_1.2,0.3212671995162964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,4,power_law_1.2,7.027302551269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,2,balanced,0.3120853304862976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,4,power_law_1.2,0.4931136131286621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,2,balanced,0.3495519955952962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,4,power_law_1.2,7.73974380493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,4,power_law_1.2,0.5076543807983398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,2,balanced,0.47812267144521076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,4,power_law_1.2,12.474694061279298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,2,balanced,0.4954506556193034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,4,power_law_1.2,0.9796223640441895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,2,balanced,0.7359253565470377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,4,power_law_1.2,1.3998720169067382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,4,power_law_1.2,22.173606872558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,4,power_law_1.2,1.9203584671020508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,2,balanced,0.9399200280507406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,4,power_law_1.2,2.420806312561035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,2,balanced,1.3885599772135417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,4,power_law_1.2,3.9249408721923826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,4,power_law_1.2,5.036608123779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,2,balanced,1.8207093874613445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,4,power_law_1.2,6.469132995605468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,2,balanced,2.6689014434814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,4,power_law_1.2,9.078009796142577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,4,power_law_1.2,15.828492736816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,2,balanced,3.5898240407307944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,4,power_law_1.2,19.408563232421876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,2,balanced,4.463962554931641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,4,power_law_1.2,47.87948303222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,2,balanced,7.41917355855306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,2,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,2,balanced,0.07332799832026164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,2,balanced,0.11272000273068745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,2,balanced,0.11616533001263936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,2,balanced,0.11760000387827556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,2,balanced,0.11867200334866841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,2,balanced,0.11966933806737264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,2,balanced,15.018741607666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,2,balanced,0.12086400389671326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,2,balanced,0.12152533729871114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,2,balanced,0.12377066413561504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,2,balanced,0.12662399808565775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,2,balanced,0.12685333689053854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,2,balanced,0.12770666678746542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,2,balanced,0.047914668917655945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,2,power_law_1.01,0.09834240078926086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,2,balanced,0.1395786702632904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,2,balanced,0.067221333583196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,2,balanced,0.14482133587201437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,2,power_law_1.01,0.12312320470809937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,2,balanced,0.10965333382288615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,2,balanced,0.11271466811498006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,2,balanced,0.14784533778826395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,2,power_law_1.01,0.13320959806442262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,2,balanced,0.11377066373825073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,2,balanced,0.1150933305422465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,2,balanced,0.15836800138155618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,2,power_law_1.01,0.18803839683532714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,2,balanced,0.11653866370519002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,2,balanced,0.11782933274904887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,2,power_law_1.01,0.18821760416030883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,2,balanced,0.1955146590868632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,2,balanced,0.20879999796549478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,2,power_law_1.01,0.19680639505386352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,2,balanced,0.28119999170303345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,2,power_law_1.01,0.2079616069793701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,2,power_law_1.01,0.06824960112571717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,2,power_law_1.01,0.21899518966674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,2,balanced,0.32331732908884686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,2,balanced,0.1202880044778188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,2,power_law_1.01,0.08021119832992554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,2,power_law_1.01,0.2466559886932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,2,balanced,0.47060267130533856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,2,balanced,0.12212266524632771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,2,power_law_1.01,0.07559040188789368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,2,power_law_1.01,0.25365118980407714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,2,balanced,0.5982240041097006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,2,power_law_1.01,0.1155519962310791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,2,power_law_1.01,0.2381056070327759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,2,power_law_1.01,0.11623040437698365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,2,balanced,0.8704426288604736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,2,power_law_1.01,0.27012479305267334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,2,power_law_1.01,0.12362240552902222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,2,power_law_1.01,0.13199360370635987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,2,power_law_1.01,0.28324480056762696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,2,balanced,1.1395946343739827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,2,power_law_1.01,0.12949759960174562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,2,power_law_1.01,0.293503999710083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,2,balanced,0.1251253286997477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,2,power_law_1.01,0.1348863959312439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,2,power_law_1.01,0.3193023920059204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,2,balanced,0.1281760036945343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,2,balanced,1.6699840227762859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,2,balanced,0.1322879989941915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,2,power_law_1.01,0.13864959478378297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,2,power_law_1.01,0.2991552114486694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,2,balanced,0.13378666838010153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,2,power_law_1.01,0.13957760334014893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,2,power_law_1.01,0.060172802209854125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,2,power_law_1.01,0.3296063899993896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,2,balanced,2.211568037668864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,2,power_law_1.01,0.14291839599609374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,2,power_law_1.01,0.0763264000415802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,2,power_law_1.01,0.418720006942749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,2,power_law_1.01,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,2,power_law_1.01,0.08472319841384887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,2,power_law_1.01,0.5466944217681885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,2,balanced,0.14969600240389505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,2,power_law_1.01,0.17356159687042236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,2,power_law_1.01,0.11328639984130859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,2,balanced,0.1543786625067393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,2,power_law_1.01,0.7445631980895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,2,balanced,2.739749272664388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,2,power_law_1.01,0.177183997631073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,2,power_law_1.01,0.1142848014831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,2,balanced,0.16236799955368042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,2,power_law_1.01,0.8078463554382325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,2,balanced,0.234224001566569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,2,power_law_1.01,0.19123200178146363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,2,power_law_1.01,0.12003200054168701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,2,power_law_1.01,1.207750415802002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,2,balanced,0.25114667415618896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,2,power_law_1.01,0.18988159894943238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,2,power_law_1.01,0.1370687961578369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,2,power_law_1.01,1.377401638031006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,2,power_law_1.01,0.24817919731140137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,2,balanced,4.402794520060222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,2,power_law_1.01,0.1441472053527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,2,power_law_1.01,2.446816062927246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,2,power_law_1.01,0.32565760612487793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,2,power_law_1.01,3.1815679550170897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,2,power_law_1.01,0.45493121147155763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,2,balanced,0.3688266674677531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,2,power_law_1.2,0.09871360063552856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,2,power_law_1.01,0.14324480295181274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,2,power_law_1.01,0.4862847805023193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,2,balanced,0.48389331499735516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,2,power_law_1.01,4.513382339477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,2,power_law_1.2,0.10675840377807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,2,power_law_1.01,0.14883840084075928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,2,balanced,0.7353759606679281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,2,power_law_1.01,0.6465280055999756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,2,power_law_1.2,0.12295680046081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,2,power_law_1.01,6.010681533813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,2,balanced,0.9944106737772623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,2,power_law_1.2,0.188864004611969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,2,power_law_1.01,0.9277503967285157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,2,power_law_1.01,6.885043334960938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,2,power_law_1.2,0.18196480274200438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,2,balanced,1.4786826769510906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,2,power_law_1.01,1.066431999206543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,2,power_law_1.01,0.1488703966140747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,2,balanced,8.662192026774088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,2,power_law_1.2,0.19260159730911255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,2,power_law_1.01,1.51843204498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,2,power_law_1.01,0.1622655987739563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,2,balanced,1.9549066225687664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,2,power_law_1.01,11.61962890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,2,power_law_1.2,0.2206592082977295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,2,power_law_1.01,2.732307243347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,2,power_law_1.01,0.16162559986114503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,2,power_law_1.2,0.23832321166992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,2,balanced,2.9121599197387695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,2,power_law_1.01,0.17978880405426026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,2,power_law_1.01,3.3192703247070314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,2,power_law_1.2,0.2512383937835693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,2,power_law_1.01,23.08452453613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,2,power_law_1.2,0.24737279415130614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,2,power_law_1.01,4.5077056884765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,2,power_law_1.01,0.19674880504608155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,2,balanced,3.86409060160319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,2,power_law_1.2,0.239136004447937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,2,power_law_1.01,6.869068908691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,2,power_law_1.01,0.20110719203948973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,2,power_law_1.2,0.26449921131134035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,2,power_law_1.01,0.24792320728302003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,2,power_law_1.2,0.28888959884643556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,2,power_law_1.01,13.433485412597657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,2,balanced,4.801168123881022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,2,power_law_1.01,0.315449595451355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,2,power_law_1.2,0.2981503963470459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,2,power_law_1.2,0.07157120108604431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,2,power_law_1.01,0.4519552230834961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,2,power_law_1.2,0.29731199741363523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,2,power_law_1.2,0.07637119889259339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,2,power_law_1.2,0.2953792095184326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,2,power_law_1.01,0.5936511993408203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,2,power_law_1.2,0.08840320110321045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,2,balanced,7.695226669311523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,2,power_law_1.2,0.312390398979187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,2,power_law_1.2,0.1160256028175354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,2,power_law_1.01,0.6927680015563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,2,power_law_1.2,0.40595197677612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,2,power_law_1.2,0.11640959978103638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,2,power_law_1.01,1.1309120178222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,2,power_law_1.2,0.1240447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,2,power_law_1.2,0.5672639846801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,2,power_law_1.01,1.3680447578430175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,2,power_law_1.2,0.13301759958267212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,2,power_law_1.2,0.7263296127319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,2,power_law_1.01,2.2018943786621095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,2,power_law_1.2,0.13240959644317626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,2,power_law_1.2,0.8030783653259277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,2,power_law_1.01,3.248089599609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,2,power_law_1.2,0.1373311996459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,2,power_law_1.2,1.307744026184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,2,balanced,15.435493469238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,2,power_law_1.01,4.649504089355469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,2,power_law_1.2,0.13698559999465942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,2,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,2,power_law_1.2,1.6522943496704101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,2,power_law_1.2,0.138099205493927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,2,power_law_1.01,6.109401702880859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,2,power_law_1.2,1.8380735397338868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,2,power_law_1.2,0.06852480173110961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,2,power_law_1.2,0.14864640235900878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,2,power_law_1.2,0.07621759772300721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,2,power_law_1.2,3.236646270751953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,2,power_law_1.01,7.4509437561035154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,2,power_law_1.2,0.15199999809265136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,2,power_law_1.2,0.11316479444503784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,2,power_law_1.2,4.734246444702149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,2,power_law_1.2,0.174835205078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,2,power_law_1.2,0.10977920293807983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,2,power_law_1.01,12.73038101196289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,2,power_law_1.2,0.18035839796066283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,2,power_law_1.2,5.445196914672851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,2,power_law_1.2,0.12706559896469116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,2,power_law_1.2,0.19096959829330445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,2,power_law_1.2,0.1336832046508789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,2,power_law_1.2,9.137881469726562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,2,power_law_1.01,21.883935546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,2,power_law_1.2,0.19937280416488648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,2,power_law_1.2,0.1434048056602478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,2,power_law_1.2,0.25736958980560304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,2,power_law_1.2,13.275436401367188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,2,power_law_1.2,0.33850879669189454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,2,power_law_1.2,0.43680639266967775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,2,power_law_1.2,0.14487680196762084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,2,power_law_1.2,22.5229248046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,2,power_law_1.2,0.1546880006790161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,2,power_law_1.2,0.5422848224639892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,2,power_law_1.2,0.6827775955200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,2,power_law_1.2,0.9029696464538575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,2,power_law_1.2,0.14935679435729982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,2,power_law_1.2,1.48155517578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,2,power_law_1.2,0.15113600492477416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,2,power_law_1.2,0.16108800172805787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,2,power_law_1.2,1.7618047714233398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,2,power_law_1.2,0.17950719594955444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,2,power_law_1.2,2.841676712036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,2,power_law_1.2,4.024959945678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,2,power_law_1.2,0.19812480211257935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,2,power_law_1.2,4.643014526367187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,2,power_law_1.2,0.21431679725646974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,2,power_law_1.2,0.241593599319458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,2,power_law_1.2,7.914246368408203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,2,power_law_1.2,0.32914559841156005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,2,power_law_1.2,0.4515711784362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,2,power_law_1.2,13.290208435058593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,2,power_law_1.2,0.6294079780578613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,2,power_law_1.2,0.8190336227416992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,2,power_law_1.2,1.221459197998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,2,power_law_1.2,1.6404224395751954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,2,power_law_1.2,2.735366439819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,2,power_law_1.2,3.1357311248779296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,2,power_law_1.2,4.321900939941406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,2,power_law_1.2,6.210047912597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,2,power_law_1.2,7.6992637634277346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,2,power_law_1.2,11.383827209472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,2,power_law_1.2,26.447360229492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,1,balanced,0.07251200079917908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,1,balanced,0.05420266588528951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,1,balanced,0.105103999376297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,1,balanced,0.07107733190059662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,1,balanced,0.18556799491246542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,1,balanced,0.11292800307273865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,1,balanced,0.18834133942921957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,1,balanced,0.11503466963768005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,1,balanced,0.1885653336842855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,1,balanced,0.11568533380826314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,1,balanced,0.19302932421366373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,1,balanced,0.11788800358772278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,1,balanced,0.19312000274658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,1,balanced,0.11986666917800903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,1,balanced,0.19549334049224854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,1,balanced,0.12052266796429952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,1,balanced,0.20229866107304892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,1,balanced,0.12153599659601848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,1,balanced,0.2037866711616516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,1,balanced,0.1220266620318095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,1,balanced,0.20873600244522095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,1,balanced,0.12637866536776224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,1,balanced,0.20917866627375284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,1,balanced,0.12665067116419473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,1,power_law_1.01,0.06549760103225707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,1,balanced,0.12877866625785828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,1,balanced,0.21126933892567953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,1,power_law_1.01,0.08731520175933838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,1,balanced,0.22252267599105835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,1,balanced,0.13993066549301147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,1,power_law_1.01,0.10311039686203002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,1,balanced,0.047168001532554626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,1,balanced,0.14736533164978027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,1,balanced,0.23144533236821493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,1,power_law_1.01,0.1729472041130066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,1,balanced,0.06725866595904033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,1,balanced,0.14891200264294943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,1,balanced,0.23307732741038004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,1,power_law_1.01,0.18896000385284423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,1,balanced,0.1090613305568695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,1,balanced,0.15558933218320212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,1,balanced,0.2521333297093709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,1,power_law_1.01,0.19407360553741454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,1,balanced,0.11241599917411804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,1,balanced,0.21579732497533163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,1,balanced,0.3210080067316691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,1,power_law_1.01,0.1985152006149292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,1,balanced,0.11411199967066447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,1,balanced,0.3209493358929952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,1,balanced,0.21490667263666788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,1,power_law_1.01,0.21093759536743165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,1,balanced,0.1165173351764679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,1,balanced,0.4399840037027995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,1,balanced,0.29049599170684814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,1,power_law_1.01,0.22644479274749757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,1,balanced,0.11812800168991089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,1,power_law_1.01,0.2321471929550171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,1,balanced,0.11955733100573222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,1,balanced,0.5192106564839681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,1,balanced,0.35277867317199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,1,power_law_1.01,0.22188799381256102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,1,balanced,0.7678346633911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,1,balanced,0.5094613234202067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,1,power_law_1.01,0.22716159820556642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,1,balanced,0.6415733496348063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,1,balanced,0.975770632425944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,1,power_law_1.01,0.051686400175094606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,1,power_law_1.01,0.23029758930206298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,1,power_law_1.01,0.2678272008895874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,1,balanced,0.12204266587893169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,1,power_law_1.01,0.06060799956321716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,1,balanced,0.9333013693491617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,1,balanced,1.4386240641276042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,1,power_law_1.01,0.2972543954849243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,1,balanced,0.12422933181126912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,1,power_law_1.01,0.07201279997825623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,1,power_law_1.01,0.289247989654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,1,balanced,1.9192533493041992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,1,power_law_1.01,0.11347839832305909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,1,balanced,1.2283466657002766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,1,power_law_1.01,0.3256256103515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,1,power_law_1.01,0.11073919534683227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,1,power_law_1.01,0.36676480770111086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,1,power_law_1.01,0.11875200271606445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,1,balanced,1.7976586023966472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,1,balanced,2.8055359522501626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,1,power_law_1.01,0.40497918128967286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,1,power_law_1.01,0.12537599802017213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,1,power_law_1.01,0.5266880035400391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,1,power_law_1.01,0.12201600074768067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,1,power_law_1.01,0.04593279957771301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,1,balanced,2.3938934008280435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,1,power_law_1.01,0.6200384140014649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,1,balanced,3.7476320266723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,1,power_law_1.01,0.12821120023727417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,1,balanced,0.12898666659990946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,1,power_law_1.01,0.06165760159492493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,1,power_law_1.01,0.8651455879211426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,1,power_law_1.01,0.12804479598999025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,1,power_law_1.01,0.07646080255508422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,1,balanced,0.13351999719937643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,1,power_law_1.01,1.10250883102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,1,power_law_1.01,0.1074944019317627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,1,power_law_1.01,0.13292800188064574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,1,power_law_1.01,0.11331199407577515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,1,balanced,2.9770825703938804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,1,balanced,0.1381013294061025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,1,power_law_1.01,1.5484736442565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,1,balanced,4.609765370686849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,1,power_law_1.01,0.13790719509124755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,1,power_law_1.01,0.11635199785232545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,1,balanced,0.14177599549293518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,1,power_law_1.01,1.968320083618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,1,power_law_1.01,0.12532479763031007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,1,power_law_1.01,0.13960959911346435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,1,power_law_1.01,0.13408000469207765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,1,power_law_1.01,2.889740753173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,1,power_law_1.01,0.16239360570907593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,1,power_law_1.2,0.06578559875488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,1,power_law_1.01,3.8121406555175783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,1,power_law_1.01,0.1751487970352173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,1,power_law_1.2,0.0840448021888733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,1,power_law_1.01,0.13187839984893798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,1,balanced,4.631226539611816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,1,balanced,0.1622933348019918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,1,balanced,7.494789123535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,1,power_law_1.01,0.18120959997177125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,1,power_law_1.01,0.1435968041419983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,1,power_law_1.01,4.776409530639649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,1,power_law_1.2,0.09940479993820191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,1,balanced,0.16873067617416382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,1,power_law_1.01,0.19256319999694824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,1,power_law_1.2,0.18326400518417357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,1,power_law_1.01,7.6764991760253904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,1,balanced,0.17852266629536948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,1,power_law_1.01,0.22479360103607177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,1,power_law_1.2,0.18391679525375365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,1,power_law_1.01,0.14095360040664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,1,balanced,0.25648534297943115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,1,power_law_1.01,0.2612031936645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,1,power_law_1.01,0.14507520198822021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,1,power_law_1.2,0.19531519412994386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,1,power_law_1.01,15.286572265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,1,power_law_1.01,0.15537279844284058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,1,balanced,0.27983466784159344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,1,power_law_1.2,0.20554239749908448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,1,power_law_1.01,0.3345024108886719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,1,power_law_1.01,0.17503999471664428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,1,power_law_1.2,0.21112959384918212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,1,power_law_1.01,0.39450879096984864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,1,power_law_1.01,0.1785215973854065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,1,power_law_1.2,0.21924479007720948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,1,power_law_1.01,0.5495808124542236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,1,balanced,9.214341481526693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,1,power_law_1.01,0.19355520009994506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,1,power_law_1.2,0.23697919845581056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,1,power_law_1.01,0.684607982635498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,1,power_law_1.01,0.22394239902496338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,1,balanced,15.306597391764322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,1,balanced,0.4194399913152059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,1,power_law_1.01,0.2808192014694214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,1,power_law_1.2,0.22020480632781983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,1,power_law_1.01,0.9680255889892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.01,0.3365312099456787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,1,power_law_1.2,0.22743680477142333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,1,balanced,0.5622666676839193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,1,power_law_1.01,1.2436415672302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.01,0.47196159362792967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,1,power_law_1.2,0.23283839225769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,1,balanced,0.8392213185628256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.01,0.6160192012786865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,1,power_law_1.01,1.8071359634399413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,1,power_law_1.2,0.25816960334777833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.01,0.903769588470459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,1,power_law_1.2,0.05265920162200928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,1,balanced,1.1069706281026204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,1,power_law_1.01,2.4916479110717775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.01,1.1554752349853517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,1,power_law_1.2,0.2842303991317749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.01,1.7028608322143555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,1,power_law_1.2,0.06350719928741455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,1,power_law_1.01,3.1124736785888674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,1,power_law_1.2,0.2910207986831665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.01,2.2068416595458986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,1,balanced,1.6480159759521484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,1,power_law_1.2,0.07030400037765502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.01,3.2906879425048827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,1,power_law_1.2,0.32133119106292723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,1,power_law_1.01,4.655968093872071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,1,power_law_1.2,0.11296000480651855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.01,4.329497528076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,1,balanced,2.1720587412516275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,1,power_law_1.2,0.3660351991653442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,1,power_law_1.2,0.11472640037536622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,1,power_law_1.01,5.3934783935546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,1,power_law_1.01,9.177324676513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,1,power_law_1.2,0.4104576110839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,1,power_law_1.01,8.596153259277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,1,power_law_1.2,0.11621760129928589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,1,balanced,3.24347718556722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,1,power_law_1.2,0.5147456169128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,1,power_law_1.2,0.12240639925003052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,1,power_law_1.2,0.6239295959472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,1,power_law_1.01,17.2097412109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,1,power_law_1.2,0.8636096000671387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,1,power_law_1.2,0.12325119972229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,1,balanced,4.31437333424886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,1,power_law_1.2,1.0827199935913085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,1,power_law_1.2,0.12567039728164672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,1,power_law_1.2,1.5532352447509765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,1,power_law_1.2,0.1274880051612854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,1,power_law_1.2,0.13045120239257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,1,power_law_1.2,1.971232032775879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,1,balanced,5.374997456868489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,1,power_law_1.2,0.13802239894866944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,1,power_law_1.2,2.8737024307250976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,1,power_law_1.2,0.14090880155563354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,1,power_law_1.2,3.8245822906494142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,1,power_law_1.2,0.16216959953308105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,1,power_law_1.2,4.7925056457519535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,1,power_law_1.2,0.17760000228881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,1,power_law_1.2,0.1789695978164673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,1,balanced,8.572410583496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,1,power_law_1.2,7.632697296142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,1,power_law_1.2,0.18574719429016112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,1,power_law_1.2,0.2258239984512329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,1,power_law_1.2,15.3383544921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,1,power_law_1.2,0.2585024118423462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,1,power_law_1.2,0.3189055919647217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,1,power_law_1.2,0.3968192100524902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,1,power_law_1.2,0.5440959930419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,1,power_law_1.2,0.6948031902313232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,1,balanced,17.211563110351562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,1,power_law_1.2,0.9606080055236816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,1,power_law_1.2,1.2423487663269044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,1,power_law_1.2,1.8010688781738282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,1,power_law_1.2,2.501625633239746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,1,power_law_1.2,3.10516471862793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,1,power_law_1.2,4.642771148681641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,1,power_law_1.2,9.215821075439454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,1,power_law_1.2,0.04567680060863495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,1,power_law_1.2,0.05852159857749939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,1,power_law_1.2,0.061484801769256595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,1,power_law_1.2,0.10988800525665283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,1,power_law_1.2,0.1130560040473938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,1,power_law_1.2,0.12020479440689087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,4,balanced,0.11932800213495891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,4,balanced,0.21267199516296387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,1,power_law_1.2,0.12718080282211303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,4,balanced,0.11215466260910034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,1,power_law_1.2,0.13313920497894288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,4,balanced,0.17694399754206339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,4,balanced,0.1755146582921346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,4,balanced,0.30484267075856525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,4,balanced,0.18023999532063803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,4,balanced,0.3155253330866496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,1,power_law_1.2,0.1334272027015686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,4,balanced,0.1800373395284017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,4,balanced,0.3084320028622945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,1,power_law_1.2,0.1446720004081726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,4,balanced,0.18286399046579996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,4,balanced,0.31006399790445965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,4,balanced,0.18344000975290933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,4,balanced,0.31175466378529865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,4,power_law_1.01,0.31658880710601806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,1,power_law_1.2,0.14247679710388184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,4,balanced,0.1852160096168518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,4,balanced,0.31176533301671344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,4,power_law_1.01,0.26093440055847167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,1,power_law_1.2,0.14718719720840454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,4,balanced,0.1855199933052063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,4,balanced,0.32235199213027954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,1,power_law_1.2,0.1494271993637085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,4,power_law_1.01,0.28019840717315675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,4,balanced,0.3272533416748047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,4,balanced,0.1899413267771403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,1,power_law_1.2,0.1723456025123596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,4,balanced,0.32679466406504315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,4,power_law_1.01,0.3093951940536499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,4,balanced,0.19036799669265747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,4,balanced,0.3322826623916626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,4,power_law_1.01,0.3097343921661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,4,balanced,0.18971200784047446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,1,power_law_1.2,0.18354560136795045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,4,balanced,0.3373653491338094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,4,power_law_1.01,0.3441663980484009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,4,balanced,0.19341333707173666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,1,power_law_1.2,0.19156479835510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,4,balanced,0.1092746655146281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,4,balanced,0.3550293445587158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,4,power_law_1.01,0.3542207956314087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,4,balanced,0.20971200863520303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,1,power_law_1.2,0.22807040214538574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,4,balanced,0.10259200135866801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,4,balanced,0.3821440140406291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,4,power_law_1.01,0.3575999975204468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,4,balanced,0.2230506738026937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,1,power_law_1.2,0.2829056024551392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,4,balanced,0.17404266198476157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,4,balanced,0.38840532302856445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,4,balanced,0.2280906637509664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.2,0.34292480945587156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,4,power_law_1.01,0.42344961166381834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,4,balanced,0.17653866608937582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,4,balanced,0.4033546845118205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,4,power_law_1.01,0.18563200235366822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,4,balanced,0.2392959992090861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,4,power_law_1.01,0.4627520084381104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,4,balanced,0.17859200636545816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,4,balanced,0.5139306783676147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.2,0.475110387802124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,4,power_law_1.01,0.14140160083770753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,4,balanced,0.28275199731191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,4,power_law_1.01,0.4780223846435547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,4,balanced,0.17985600233078003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,4,power_law_1.01,0.14771840572357178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,4,balanced,0.4666186571121216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.2,0.618668794631958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,4,power_law_1.01,0.17952640056610109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,4,power_law_1.01,0.5839424133300781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,4,balanced,0.29028799136479694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,4,balanced,0.18125865856806436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,4,balanced,0.7351679801940918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.2,0.8930368423461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,4,power_law_1.01,0.1804800033569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,4,power_law_1.01,0.6789696216583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,4,balanced,0.18147732814153036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,4,power_law_1.01,0.19988479614257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.2,1.1698944091796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,4,balanced,0.8487626711527506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,4,power_law_1.01,0.24522879123687744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,4,balanced,0.43858667214711505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,4,power_law_1.01,0.49256319999694825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,4,power_law_1.01,0.21766400337219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.2,1.7021503448486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,4,balanced,1.241434653600057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,4,power_law_1.01,0.5624576091766358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,4,power_law_1.01,0.22323200702667237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.2,2.236416053771973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,4,power_law_1.01,0.71561598777771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,4,power_law_1.01,0.23343360424041748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,4,balanced,0.5099146763483683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,4,balanced,1.494874636332194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,4,power_law_1.01,0.2350719928741455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,4,power_law_1.01,0.6444287776947022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.2,3.2899776458740235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,4,balanced,0.1813066601753235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,4,power_law_1.01,0.23943679332733153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,4,power_law_1.01,0.8949695587158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,4,balanced,2.295482635498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,4,power_law_1.01,0.25632638931274415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.2,4.386553573608398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,4,balanced,0.7332959969838461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,4,balanced,0.18337599436442056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,4,power_law_1.01,0.9973952293395996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,4,power_law_1.01,0.2979840040206909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,1,power_law_1.2,5.459199905395508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,4,power_law_1.01,0.3650752067565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,4,balanced,2.932405471801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,4,power_law_1.01,0.15094399452209473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,4,power_law_1.01,1.3251839637756349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,4,balanced,0.8956800301869711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,4,power_law_1.01,0.412505578994751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,4,power_law_1.01,2.0248767852783205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,4,power_law_1.01,0.1743232011795044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,4,power_law_1.01,0.40685439109802246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,1,power_law_1.2,8.710431671142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,4,power_law_1.01,0.6123583793640137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,4,power_law_1.01,0.1453760027885437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,4,balanced,4.390927950541179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,4,power_law_1.01,3.0357696533203127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,4,balanced,1.344165325164795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,4,power_law_1.01,0.6130047798156738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,4,power_law_1.01,0.17694079875946045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,4,power_law_1.01,3.9482688903808594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,1,power_law_1.2,17.373452758789064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,4,power_law_1.01,0.7681600093841553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,4,power_law_1.01,0.17838720083236695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,4,power_law_1.01,1.0506303787231446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,4,balanced,1.7176052729288738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,4,balanced,0.1877280076344808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,4,power_law_1.2,0.31661438941955566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,4,power_law_1.01,5.736665725708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,4,power_law_1.01,0.22322559356689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,4,balanced,6.080602645874023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,4,power_law_1.01,1.3565247535705567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,4,balanced,0.191210667292277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,4,power_law_1.2,0.2887808084487915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,4,power_law_1.01,0.2555840015411377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,4,power_law_1.01,2.326969528198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,4,power_law_1.01,9.029593658447265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,4,balanced,2.537391980489095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,4,balanced,0.19527999560038248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,4,power_law_1.01,3.1987327575683593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,4,power_law_1.01,0.2534847974777222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,4,power_law_1.2,0.30730879306793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,4,balanced,0.1977013349533081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,4,power_law_1.01,3.5375232696533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,4,power_law_1.01,10.565817260742188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,4,balanced,7.79744021097819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,4,power_law_1.2,0.30974080562591555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,4,power_law_1.01,7.636370849609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,4,power_law_1.2,0.3100543975830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,4,balanced,3.3525492350260415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,4,power_law_1.01,0.25832960605621336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,4,power_law_1.01,17.857862854003905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,4,power_law_1.01,7.427142333984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,4,power_law_1.2,0.33445119857788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,4,power_law_1.01,0.2489856004714966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,4,balanced,0.21493866046269736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,4,power_law_1.2,0.35537281036376955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,4,power_law_1.01,12.210771179199218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,4,power_law_1.01,17.33675537109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,4,balanced,0.22086399793624878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,4,balanced,4.177573204040527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,4,balanced,12.531898498535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,4,power_law_1.2,0.36726400852203367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,4,power_law_1.01,0.24255359172821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,4,power_law_1.01,18.494744873046876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,4,balanced,0.22992000977198282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,4,power_law_1.2,0.411897611618042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,4,power_law_1.01,0.2578495979309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,4,balanced,0.3343626658121745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,4,power_law_1.2,0.4262400150299072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,4,power_law_1.01,37.54222717285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,4,power_law_1.01,0.27559680938720704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,4,balanced,0.3582719961802165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,4,power_law_1.2,0.48051838874816893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,4,power_law_1.01,0.3305855989456177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,4,power_law_1.01,33.800146484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,4,balanced,6.8961976369222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,4,balanced,0.5312533378601074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,4,power_law_1.2,0.5377471923828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,4,power_law_1.2,0.648518419265747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,4,balanced,0.7007306416829427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,4,power_law_1.01,0.34391040802001954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,4,power_law_1.2,0.5468480110168457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,4,power_law_1.01,0.3469311952590942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,4,power_law_1.01,62.877838134765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,4,power_law_1.2,0.608518409729004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,4,power_law_1.01,0.4293824195861816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,4,balanced,24.566848754882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,4,power_law_1.2,0.7424064159393311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,4,power_law_1.01,0.6163839817047119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,4,balanced,1.0657013257344563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,4,power_law_1.2,0.5947711944580079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,4,power_law_1.01,1.0253824234008788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,4,power_law_1.2,0.9750783920288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,4,power_law_1.01,1.2668416023254394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,4,balanced,1.3940480550130208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,4,power_law_1.2,0.9602560043334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,4,power_law_1.01,1.8036224365234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,4,balanced,14.222442626953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,4,balanced,2.100560029347738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,4,power_law_1.2,1.8432384490966798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,4,power_law_1.01,2.5915327072143555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,4,power_law_1.2,1.9999168395996094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,4,balanced,2.7868852615356445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,4,power_law_1.01,4.130656051635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,4,power_law_1.2,2.768044853210449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,4,power_law_1.01,6.144268798828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,4,power_law_1.2,3.2818817138671874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,4,balanced,4.234042803446452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,4,power_law_1.01,6.652006530761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,4,power_law_1.2,6.9506690979003904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,4,balanced,5.6312001546223955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,4,power_law_1.01,12.345753479003907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,4,power_law_1.2,8.485056304931641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,4,power_law_1.01,18.414694213867186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,4,power_law_1.2,14.682015991210937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,4,balanced,7.144912083943685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,4,power_law_1.01,17.983392333984376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,4,power_law_1.2,22.61664581298828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,4,power_law_1.2,22.540019226074218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,4,power_law_1.01,37.170266723632814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,4,balanced,11.631882985432943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,4,power_law_1.2,42.224615478515624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,4,power_law_1.01,78.83615112304688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,4,power_law_1.2,83.12958374023438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,4,balanced,25.18018086751302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,4,power_law_1.2,0.1703871965408325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,4,power_law_1.2,0.1537343978881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,4,power_law_1.2,0.17344640493392943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,4,power_law_1.2,0.17545599937438966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,4,power_law_1.2,0.17946239709854125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,4,power_law_1.2,0.19648640155792235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,4,power_law_1.2,0.21500160694122314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,4,power_law_1.2,0.20791680812835694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,4,power_law_1.2,0.23047680854797364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,4,power_law_1.2,0.2370687961578369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,4,power_law_1.2,0.2294912099838257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,4,power_law_1.2,0.272761607170105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,4,power_law_1.2,0.26720640659332273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,4,power_law_1.2,0.32870399951934814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,4,power_law_1.2,0.3783168077468872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,4,power_law_1.2,0.44617600440979005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,4,power_law_1.2,0.43958401679992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,4,power_law_1.2,0.653062391281128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,4,power_law_1.2,0.6768511772155762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,2,balanced,0.06782400111357371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,2,balanced,0.11526933312416077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,4,power_law_1.2,0.7360767841339111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,2,balanced,0.10331199566523235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,2,balanced,0.1647040049235026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,4,power_law_1.2,0.1600000023841858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,2,balanced,0.17182934284210205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,4,power_law_1.2,0.16019200086593627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,2,balanced,0.31169599294662476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,4,power_law_1.2,1.2528639793395997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,4,power_law_1.2,0.14587520360946654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,2,balanced,0.17474132776260376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,2,balanced,0.3038880030314128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,4,power_law_1.2,1.6483072280883788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,4,power_law_1.2,0.17709439992904663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,4,power_law_1.2,0.17927039861679078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,2,balanced,0.17595199743906656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,2,balanced,0.3039733370145162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,4,power_law_1.2,2.4790143966674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,4,power_law_1.2,0.2141632080078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,2,balanced,0.30713067452112836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,2,balanced,0.17646400133768717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,4,power_law_1.2,0.25265278816223147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,4,power_law_1.2,3.1785856246948243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,4,power_law_1.2,0.29279360771179197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,2,balanced,0.17801066239674887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,2,balanced,0.3060693343480428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,4,power_law_1.2,4.003334426879883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,2,balanced,0.1814240018526713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,2,balanced,0.3084533413251241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,2,balanced,0.18099733193715414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,4,power_law_1.2,0.26457600593566893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,2,balanced,0.31910934050877887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,4,power_law_1.2,8.241248321533202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,4,power_law_1.2,0.2643647909164429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,2,balanced,0.18346667289733887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,2,balanced,0.31997867425282794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,2,balanced,0.19232000907262167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,4,power_law_1.2,12.609983825683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,2,balanced,0.331061323483785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,2,balanced,0.06272533535957336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,4,power_law_1.2,0.25063679218292234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,2,balanced,0.1885706583658854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,2,balanced,0.33133333921432495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,2,balanced,0.09829333424568176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,4,power_law_1.2,0.2798719882965088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,4,power_law_1.2,15.880653381347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,2,balanced,0.19050133228302002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,2,balanced,0.33323200543721515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,4,power_law_1.2,0.28159360885620116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,2,balanced,0.16846932967503866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,2,balanced,0.2015413244565328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,4,power_law_1.2,0.3672447919845581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,2,balanced,0.34891732533772785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,2,balanced,0.1714400053024292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,2,balanced,0.21282132466634116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,4,power_law_1.2,17.304135131835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,2,balanced,0.35606932640075684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,2,balanced,0.17358932892481485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,4,power_law_1.2,0.3313215970993042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,2,balanced,0.21468265851338705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,2,balanced,0.17617066701253256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,2,balanced,0.35631998380025226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,4,power_law_1.2,0.362828803062439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,2,balanced,0.21987199783325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,4,power_law_1.2,0.44991359710693357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,2,balanced,0.1776533325513204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,2,balanced,0.36999468008677167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,4,power_law_1.2,0.7187007904052735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,2,balanced,0.312394658724467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,2,balanced,0.1783413290977478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,4,power_law_1.2,45.47544860839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,4,power_law_1.2,0.8183232307434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,2,balanced,0.4909813404083252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,2,balanced,0.30610666672388714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,4,power_law_1.2,1.5244735717773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,2,balanced,0.49059732755025226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,4,power_law_1.2,1.6220159530639648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,2,balanced,0.418559988339742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,2,balanced,0.6764533519744873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,2,balanced,0.493887980779012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,4,power_law_1.2,3.819820785522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,2,balanced,0.18240533272425333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,2,balanced,0.7924746672312418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,2,balanced,0.7254559993743896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,4,power_law_1.2,3.603718566894531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,2,balanced,0.18386665980021158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,2,power_law_1.01,0.13506560325622557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,4,power_law_1.2,7.2943168640136715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,2,balanced,1.1974986394246419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,2,balanced,0.9220746358235677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,2,power_law_1.01,0.1803264021873474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,4,power_law_1.2,8.418418884277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,2,balanced,1.527781327565511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,2,balanced,1.3495359420776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,2,power_law_1.01,0.2071552038192749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,4,power_law_1.2,10.83096923828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,2,power_law_1.01,0.2952768087387085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,2,balanced,2.2678613662719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,2,balanced,1.771509329477946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,4,power_law_1.2,20.583827209472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,2,power_law_1.01,0.3026112079620361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,2,power_law_1.01,0.3092672109603882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,2,balanced,0.18889600038528442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,2,balanced,2.998933474222819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,2,balanced,2.6113386154174805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,4,power_law_1.2,26.208377075195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,2,power_law_1.01,0.32663679122924805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,2,balanced,0.191594660282135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,2,power_law_1.01,0.3181567907333374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,2,power_law_1.01,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,2,balanced,0.19647467136383057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,2,balanced,4.533679962158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,2,power_law_1.01,0.3839679956436157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,2,balanced,3.480549176534017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,2,power_law_1.01,0.11807359457015991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,2,balanced,0.19925334056218466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,4,power_law_1.2,39.533477783203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,2,power_law_1.01,0.36389760971069335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,2,power_law_1.01,0.11804159879684448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,2,power_law_1.01,0.09123839735984803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,2,power_law_1.01,0.37351040840148925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,2,balanced,6.155775705973308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,2,power_law_1.01,0.17523839473724365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,2,power_law_1.01,0.40523519515991213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,2,balanced,4.354960123697917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,2,power_law_1.01,0.12318079471588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,2,power_law_1.01,0.17463680505752563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,2,power_law_1.01,0.4311039924621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,2,balanced,0.22121065855026245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,2,power_law_1.01,0.11546880006790161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,2,power_law_1.01,0.1859455943107605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,4,power_law_1.2,62.091009521484374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,2,power_law_1.01,0.42783360481262206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,2,balanced,0.2270080049832662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,2,power_law_1.01,0.16070400476455687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,2,power_law_1.01,0.1968832015991211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,2,balanced,7.708085378011067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,2,power_law_1.01,0.4917503833770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,2,balanced,0.23667200406392416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,2,power_law_1.01,0.17404799461364745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,2,power_law_1.01,0.1903040051460266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,2,power_law_1.01,0.5141632080078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,2,balanced,7.1617279052734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,2,power_law_1.01,0.19660160541534424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,2,balanced,0.34614400068918866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,2,power_law_1.01,0.19790719747543334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,2,power_law_1.01,0.21824638843536376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,2,power_law_1.01,0.5625728130340576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,2,balanced,0.36855467160542804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,2,power_law_1.01,0.2041088104248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,2,power_law_1.01,0.227622389793396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,2,power_law_1.01,0.6281599998474121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,2,power_law_1.01,0.2050623893737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,2,balanced,12.384479522705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,2,power_law_1.01,0.8013055801391602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,2,power_law_1.01,0.23018879890441896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,2,power_law_1.01,1.006220817565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,2,power_law_1.01,0.21261439323425294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,2,power_law_1.01,0.22306559085845948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,2,balanced,0.5526826779047648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,2,power_law_1.01,1.4529215812683105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,2,power_law_1.01,0.23594880104064941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,2,power_law_1.01,0.24335360527038574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,2,balanced,0.7519786357879639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,2,power_law_1.01,0.23927679061889648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,2,power_law_1.01,2.11157112121582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,2,balanced,14.261066436767578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,2,power_law_1.01,0.2922175884246826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,2,balanced,1.1343093713124592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,2,power_law_1.01,2.494118309020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,2,power_law_1.01,0.2212928056716919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,2,power_law_1.01,0.30008320808410643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,2,power_law_1.01,0.23809919357299805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,2,power_law_1.01,3.846681594848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,2,balanced,1.4886132876078289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,2,power_law_1.01,0.36392319202423096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,2,power_law_1.01,0.2643455982208252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,2,power_law_1.01,4.834643173217773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,2,balanced,25.281178792317707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,2,power_law_1.01,0.4191103935241699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,2,power_law_1.01,0.2812288045883179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,2,balanced,2.2503627141316733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,2,power_law_1.01,0.5839680194854736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,2,power_law_1.01,6.532902526855469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,2,power_law_1.01,0.6984000205993652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,2,power_law_1.01,0.2784640073776245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,2,balanced,2.9645814895629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,2,power_law_1.01,10.167596435546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,2,power_law_1.01,0.31820800304412844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,2,power_law_1.01,1.1339584350585938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,2,power_law_1.01,0.3474112033843994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,2,power_law_1.01,1.5414912223815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,2,power_law_1.01,12.727641296386718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,2,balanced,4.406522750854492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,2,power_law_1.01,0.5188864231109619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,2,power_law_1.01,2.2825279235839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,2,power_law_1.01,19.627059936523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,2,power_law_1.01,0.6067903995513916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,2,power_law_1.01,2.8962112426757813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,2,balanced,5.904938379923503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,2,power_law_1.01,3.33043212890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,2,power_law_1.01,0.9874624252319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,2,power_law_1.01,4.414969635009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,2,power_law_1.01,1.0902591705322267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,2,power_law_1.01,40.012542724609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,2,balanced,7.3874562581380205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,2,power_law_1.01,7.994656372070312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,2,power_law_1.01,1.857004737854004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,2,power_law_1.01,10.70843505859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,2,power_law_1.01,2.6589311599731444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,2,power_law_1.01,3.226265716552734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,2,power_law_1.01,22.356282043457032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,2,balanced,11.9486452738444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,2,power_law_1.01,4.748524856567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,2,power_law_1.01,7.822745513916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,2,power_law_1.01,10.05261459350586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,2,power_law_1.01,11.788518524169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,2,power_law_1.2,0.14534399509429932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,2,power_law_1.01,16.122438049316408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,2,balanced,25.17560577392578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,2,power_law_1.2,0.17935359477996826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,2,power_law_1.2,0.21785600185394288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,2,power_law_1.2,0.3022847890853882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,2,power_law_1.01,44.37730407714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,2,power_law_1.2,0.2935296058654785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,2,power_law_1.2,0.31322879791259767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,2,power_law_1.2,0.32972800731658936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,2,power_law_1.2,0.3206912040710449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,2,power_law_1.2,0.34478719234466554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,2,power_law_1.2,0.3796479940414429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,2,power_law_1.2,0.3933824062347412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,2,power_law_1.2,0.38297600746154786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,2,power_law_1.2,0.44873600006103515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,2,power_law_1.2,0.4084928035736084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,2,power_law_1.2,0.4807551860809326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,2,power_law_1.2,0.48976640701293944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,2,power_law_1.2,0.5919104099273682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,2,power_law_1.2,0.6742015838623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,2,power_law_1.2,0.10486400127410889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,2,power_law_1.2,0.7773824214935303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,2,power_law_1.2,0.1022271990776062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,2,power_law_1.2,1.1036800384521483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,2,power_law_1.2,0.10371840000152588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,2,power_law_1.2,1.3170559883117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,2,power_law_1.2,0.17590399980545043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,2,power_law_1.2,1.8166847229003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,2,power_law_1.2,0.17412480115890502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,2,power_law_1.2,2.48404483795166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,2,power_law_1.2,0.18929280042648317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,2,power_law_1.2,0.20698881149291992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,2,power_law_1.2,3.7189056396484377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,2,power_law_1.2,0.1889024019241333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,2,power_law_1.2,5.303622436523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,2,power_law_1.2,0.19861119985580444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,2,power_law_1.2,7.315641784667969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,2,power_law_1.2,0.2064512014389038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,2,power_law_1.2,0.20135679244995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,2,power_law_1.2,10.773484802246093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,2,power_law_1.2,0.23454079627990723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,2,power_law_1.2,0.2291327953338623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,2,power_law_1.2,13.3891845703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,2,power_law_1.2,0.25096960067749025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,2,power_law_1.2,0.28378241062164306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,2,power_law_1.2,21.25669708251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,2,power_law_1.2,0.2931391954421997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,1,balanced,0.1095199982325236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,2,power_law_1.2,0.31169919967651366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,1,balanced,0.1644213298956553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,2,power_law_1.2,0.39359359741210936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,1,balanced,0.30344533920288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,2,power_law_1.2,40.39388732910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,2,power_law_1.2,0.5061759948730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,2,power_law_1.2,0.08375040292739869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,1,balanced,0.30453866720199585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,2,power_law_1.2,0.6662079811096191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,2,power_law_1.2,0.12355200052261353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,1,balanced,0.30240533749262494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,2,power_law_1.2,0.7578559875488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,1,balanced,0.3053013285001119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,2,power_law_1.2,0.14633599519729615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,2,power_law_1.2,1.12423677444458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,1,balanced,0.3062826593716939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,2,power_law_1.2,0.1720639944076538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,1,balanced,0.30823467175165814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,2,power_law_1.2,1.368671989440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,2,power_law_1.2,0.1685312032699585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,1,balanced,0.31817599137624103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,2,power_law_1.2,2.0099456787109373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,2,power_law_1.2,0.19296640157699585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,1,balanced,0.3206186691919963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,2,power_law_1.2,0.22037119865417482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,2,power_law_1.2,2.9930112838745115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,1,balanced,0.33170666297276813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,2,power_law_1.2,0.22958080768585204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,2,power_law_1.2,3.9238014221191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,1,balanced,0.3256053328514099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,1,balanced,0.07124799986680348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,2,power_law_1.2,6.391827011108399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,1,balanced,0.327349325021108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,1,balanced,0.10062399506568909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,2,power_law_1.2,0.22884480953216552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,1,balanced,0.3535733222961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,2,power_law_1.2,7.408281707763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,1,balanced,0.16818133989969888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,2,power_law_1.2,0.2396480083465576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,1,balanced,0.3558080196380615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,1,balanced,0.17201600472132364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,2,power_law_1.2,12.996051025390624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,1,balanced,0.3577653169631958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,1,balanced,0.17436800400416055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,1,balanced,0.3833226760228475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,1,balanced,0.1760586698849996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,2,power_law_1.2,0.21461119651794433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,1,balanced,0.46781333287556964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,1,balanced,0.17829867204030356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,2,power_law_1.2,24.17439422607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,2,power_law_1.2,0.23401598930358886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,1,balanced,0.4736800193786621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,1,balanced,0.18069332838058472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,2,power_law_1.2,0.24196479320526124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,1,balanced,0.06612800061702728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,1,balanced,0.6669440269470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,1,balanced,0.18004266421000162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,2,power_law_1.2,0.2780224084854126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,1,balanced,0.09818666179974873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,1,balanced,0.8384746710459391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,1,balanced,0.18091734250386557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,1,balanced,0.16645866632461548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,2,power_law_1.2,0.27864320278167726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,1,balanced,0.18775999546051025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,1,balanced,1.2146560351053874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,1,balanced,0.1696000099182129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,2,power_law_1.2,0.32664320468902586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,1,balanced,0.18810667594273886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,1,balanced,0.1722773313522339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,1,balanced,1.595354715983073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,1,power_law_1.01,0.10878080129623413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,2,power_law_1.2,0.3726655960083008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,1,balanced,0.1922773321469625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,1,balanced,0.17421332995096842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,1,power_law_1.01,0.07027199864387512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,2,power_law_1.2,0.48496642112731936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,1,power_law_1.01,0.13050240278244019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,1,balanced,2.358527978261312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,1,balanced,0.20563733577728271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,1,balanced,0.17753599087397257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,1,power_law_1.01,0.16698240041732787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,2,power_law_1.2,0.655679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,1,power_law_1.01,0.08319360017776489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,1,power_law_1.01,0.2978431940078735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,1,balanced,0.21473066012064615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,1,balanced,0.17939732472101846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,1,power_law_1.01,0.29552640914916994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,1,power_law_1.01,0.10603519678115844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,1,balanced,3.1323200861612954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,1,power_law_1.01,0.3118079900741577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,1,balanced,0.21531200408935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,2,power_law_1.2,0.962611198425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,1,power_law_1.01,0.1693120002746582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,1,power_law_1.01,0.3190144062042236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,2,power_law_1.2,1.1466943740844726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,1,balanced,0.22433600823084512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,1,power_law_1.01,0.3133568048477173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,1,power_law_1.01,0.16999679803848267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,1,power_law_1.01,0.34276480674743653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,1,power_law_1.01,0.1768704056739807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,2,power_law_1.2,1.7688896179199218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,1,balanced,4.58297602335612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,1,balanced,0.30509867270787555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,1,power_law_1.01,0.3436608076095581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,1,power_law_1.01,0.1827712059020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,1,balanced,0.18307733535766602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,2,power_law_1.2,2.4711551666259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,1,balanced,0.31013866265614826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,1,power_law_1.01,0.35360639095306395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,1,power_law_1.01,0.18413439989089966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,1,balanced,0.18594133853912354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,1,power_law_1.01,0.36871678829193116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,2,power_law_1.2,3.334239959716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,1,balanced,0.43775999546051025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,1,power_law_1.01,0.3873728036880493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,1,balanced,6.198981602986653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,1,power_law_1.01,0.1896064043045044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,1,power_law_1.01,0.40842242240905763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,2,power_law_1.2,4.576825714111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,1,balanced,0.5318026542663574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,1,power_law_1.01,0.19208320379257202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,1,power_law_1.01,0.4238976001739502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,1,power_law_1.01,0.420959997177124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,1,power_law_1.01,0.20419199466705323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,2,power_law_1.2,6.94537582397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,1,balanced,0.7558133602142334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,1,power_law_1.01,0.49610238075256347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,1,balanced,7.6962935129801435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,1,power_law_1.01,0.21013119220733642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,1,power_law_1.01,0.5690368175506592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,2,power_law_1.2,9.729881286621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,1,balanced,0.975050687789917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,1,power_law_1.01,0.6505792140960693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,1,power_law_1.01,0.21566081047058105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,1,power_law_1.01,0.8585280418395996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,1,power_law_1.01,0.23411839008331298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,1,balanced,0.19390400250752768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,2,power_law_1.2,11.559820556640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,1,power_law_1.01,0.9870400428771973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,1,balanced,1.4132800102233887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,1,power_law_1.01,1.3737919807434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,1,power_law_1.01,0.24929280281066896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,1,balanced,0.19926400979359946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,1,power_law_1.01,1.7309183120727538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,1,power_law_1.01,0.25050880908966067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,1,balanced,1.8905439376831055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,1,balanced,0.20499199628829956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,1,balanced,12.547332763671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,2,power_law_1.2,22.567462158203124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,1,power_law_1.01,2.5281728744506835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,1,power_law_1.01,0.2973759889602661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,1,balanced,0.21217066049575806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,1,power_law_1.01,3.2500415802001954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,1,balanced,0.23806933561960855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,1,power_law_1.01,0.34695680141448976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,1,balanced,2.7567307154337564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,1,power_law_1.01,4.9080768585205075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,1,power_law_1.01,0.38373119831085206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,1,balanced,0.24663466215133667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,2,power_law_1.2,40.543948364257815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,1,power_law_1.01,6.512230682373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,1,balanced,0.2611306707064311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,1,power_law_1.01,0.5050943851470947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,1,power_law_1.01,8.07175064086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,1,balanced,0.3813706636428833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,1,balanced,3.71613343556722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,1,power_law_1.01,0.5834432125091553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,1,power_law_1.01,12.759916687011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,1,power_law_1.01,0.8082943916320801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,1,balanced,0.42034133275349933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,1,power_law_1.01,1.0534655570983886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,1,balanced,0.6435253222783407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,1,balanced,4.642719904581706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,1,balanced,25.06561533610026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,1,power_law_1.01,1.4832192420959474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,1,power_law_1.01,25.48970947265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,1,balanced,0.8568639755249023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,1,power_law_1.01,1.949305534362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,1,balanced,1.2791146437327068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,1,power_law_1.01,2.832729530334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,1,balanced,1.6765653292338054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,1,power_law_1.01,3.8673534393310547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,1,balanced,7.421728134155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,1,balanced,2.5111893018086753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,1,power_law_1.01,4.811910247802734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,1,power_law_1.01,7.520941162109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,1,balanced,3.328746795654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,1,power_law_1.01,14.8935302734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,1,balanced,4.971813201904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,1,balanced,14.942906697591146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,1,balanced,6.633989334106445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,1,power_law_1.01,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,1,power_law_1.01,0.0788096010684967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,1,balanced,8.320730845133463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,1,power_law_1.01,0.09916160106658936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,1,power_law_1.01,0.16429439783096314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,1,power_law_1.01,0.17198079824447632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,1,power_law_1.01,0.18807679414749146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,1,balanced,13.480714162190756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,1,power_law_1.01,0.1921280026435852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,1,power_law_1.01,0.21773440837860109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,1,power_law_1.01,0.21044480800628662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,1,power_law_1.2,0.10868480205535888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,1,power_law_1.01,0.21842560768127442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,1,power_law_1.2,0.12781440019607543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,1,power_law_1.2,0.14819200038909913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,1,power_law_1.2,0.2957632064819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,1,power_law_1.2,0.3011840105056763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,1,power_law_1.01,0.20992000102996827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,1,balanced,27.803029378255207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,1,power_law_1.2,0.3115135908126831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,1,power_law_1.2,0.31164801120758057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,1,power_law_1.01,0.22221438884735106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,1,power_law_1.2,0.32051839828491213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,1,power_law_1.2,0.34224638938903806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,1,power_law_1.01,0.22497920989990233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,1,power_law_1.2,0.3565824031829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,1,power_law_1.2,0.34840960502624513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,1,power_law_1.01,0.24513280391693115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,1,power_law_1.2,0.36494081020355223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,1,power_law_1.01,0.2699968099594116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,1,power_law_1.2,0.3755392074584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,1,power_law_1.2,0.40470399856567385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,1,power_law_1.01,0.2819008111953735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,1,power_law_1.2,0.41878399848937986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,1,power_law_1.01,0.33537280559539795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,1,power_law_1.2,0.44161281585693357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,1,power_law_1.2,0.4920383930206299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,1,power_law_1.01,0.41558399200439455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,1,power_law_1.2,0.578495979309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,1,power_law_1.2,0.6502975940704345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.01,0.5167424201965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,1,power_law_1.2,0.8451264381408692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.01,0.7388991832733154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,1,power_law_1.2,0.9775487899780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,1,power_law_1.2,1.3578304290771483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.01,0.9709695816040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,1,power_law_1.2,1.749305534362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.01,1.382688045501709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,1,power_law_1.2,2.505670356750488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,1,power_law_1.2,3.267795181274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.01,1.7906623840332032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,1,power_law_1.2,4.752396774291992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.01,2.6088064193725584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,1,power_law_1.2,6.400300598144531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.01,3.4620033264160157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,1,power_law_1.2,8.020166778564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.01,5.107462310791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,1,power_law_1.2,12.751763153076173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.01,6.7653953552246096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,1,power_law_1.2,25.20720672607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,1,power_law_1.01,8.45955810546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,1,power_law_1.2,0.06995199918746949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,1,power_law_1.01,13.540159606933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,1,power_law_1.2,0.0832256019115448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,1,power_law_1.2,0.10243840217590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,1,power_law_1.2,0.16595840454101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,1,power_law_1.01,27.479776000976564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,1,power_law_1.2,0.1728767991065979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,1,power_law_1.2,0.1791808009147644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,1,power_law_1.2,0.18465919494628907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,1,power_law_1.2,0.18546559810638427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,1,power_law_1.2,0.1867967963218689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,1,power_law_1.2,0.1982208013534546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,1,power_law_1.2,0.2065727949142456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,1,power_law_1.2,0.06576640009880066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,1,power_law_1.2,0.21437439918518067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,1,power_law_1.2,0.22079360485076904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,1,power_law_1.2,0.07052800059318542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,1,power_law_1.2,0.23848319053649902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,1,power_law_1.2,0.10085120201110839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,1,power_law_1.2,0.16397440433502197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,1,power_law_1.2,0.2446847915649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,1,power_law_1.2,0.170905601978302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,1,power_law_1.2,0.2510528087615967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,1,power_law_1.2,0.28860158920288087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,1,power_law_1.2,0.1831936001777649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,1,power_law_1.2,0.33235199451446534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,1,power_law_1.2,0.20093441009521484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,1,power_law_1.2,0.3854016065597534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,1,power_law_1.2,0.20611200332641602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,1,power_law_1.2,0.5188479900360108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,1,power_law_1.2,0.6028351783752441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,1,power_law_1.2,0.20894079208374022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,1,power_law_1.2,0.826476764678955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,1,power_law_1.2,0.2180095911026001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,1,power_law_1.2,1.0591936111450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,1,power_law_1.2,1.487705612182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,1,power_law_1.2,1.930348777770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,1,power_law_1.2,0.20819199085235596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,4,balanced,0.09001599748929341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,1,power_law_1.2,2.8316287994384766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,1,power_law_1.2,0.21731839179992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,4,balanced,0.12052800258000691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,1,power_law_1.2,0.2333888053894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,1,power_law_1.2,3.9050048828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,1,power_law_1.2,0.2626559972763062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,4,balanced,0.20092799266179404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,1,power_law_1.2,4.90079345703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,1,power_law_1.2,0.28047358989715576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,4,balanced,0.3651306629180908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,1,power_law_1.2,0.28837759494781495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,1,power_law_1.2,7.465497589111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,4,balanced,0.6916000048319498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,1,power_law_1.2,0.32968959808349607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,4,balanced,1.3406079610188801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,1,power_law_1.2,0.4263296127319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,1,power_law_1.2,14.781861877441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,4,balanced,1.3310933113098145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.2,0.5249792098999023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,4,balanced,0.0658240020275116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,4,balanced,1.3334719340006511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.2,0.7391935825347901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,4,balanced,0.08284266789754231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,4,balanced,1.3328320185343425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.2,0.9589376449584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,4,balanced,0.12588266531626383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,4,balanced,1.3399732907613118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.2,1.3407296180725097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,4,balanced,0.21092800299326578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,4,balanced,1.3422986666361492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.2,1.7528959274291993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,4,balanced,0.36902399857838947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,4,balanced,1.3559412956237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.2,2.5845632553100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,4,balanced,0.6992586453755697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,4,balanced,0.07273066540559132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,4,balanced,1.35590394337972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,4,balanced,0.7069546381632487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.2,3.408345413208008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,4,balanced,1.354863961537679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,4,balanced,0.08933333555857341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,4,balanced,0.6977759997049967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.2,5.029369735717774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,4,balanced,0.1381386617819468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,4,balanced,1.3602666854858398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,4,balanced,0.6979573567708334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.2,6.693421173095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,4,balanced,0.21799467007319132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,4,balanced,1.3738826115926106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,4,balanced,0.7032426993052164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,4,balanced,0.37860266367594403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,4,balanced,0.7064692974090576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,1,power_law_1.2,8.367807769775391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,4,balanced,1.3830347061157227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,4,balanced,0.7029759883880615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,4,balanced,0.7121439774831136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,4,balanced,1.450719992319743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,4,balanced,0.7063573201497396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,1,power_law_1.2,13.482176208496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,4,balanced,0.7272960344950358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,4,balanced,0.7069706916809082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,4,balanced,1.4561707178751628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,4,balanced,0.7253599961598715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,4,balanced,0.7086559931437174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,4,balanced,0.7375306288401285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,1,power_law_1.2,27.533465576171874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,4,balanced,1.5232532819112141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,4,balanced,0.7120160261789957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,4,balanced,0.7449759642283121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,4,balanced,0.7161173025767008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,4,balanced,1.5912960370381672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,4,balanced,0.7609972953796387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,4,balanced,0.7218026320139567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,4,power_law_1.01,0.22235519886016847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,4,balanced,0.7268160184224447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,4,balanced,0.7813599904378256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,4,balanced,1.6665813128153484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,4,power_law_1.01,0.3599679946899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,4,balanced,0.7373493512471517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,4,balanced,0.8032693068186442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,4,power_law_1.01,0.22901759147644044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,4,balanced,0.7523146470387777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,4,power_law_1.01,0.2984447956085205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,4,balanced,1.7516853014628093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,4,balanced,0.855013370513916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,4,balanced,0.7638506889343262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,4,power_law_1.01,0.5537024021148682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,4,balanced,0.7821813424428304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,4,balanced,0.9157493114471436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,4,power_law_1.01,0.7125887870788574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,4,power_law_1.01,0.946617603302002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,4,balanced,2.342437267303467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,4,balanced,0.9868106842041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,4,power_law_1.01,1.025926399230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,4,power_law_1.01,1.0653951644897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,4,balanced,0.827029307683309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,4,power_law_1.01,1.0478079795837403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,4,balanced,1.0732320149739583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,4,balanced,2.4797226587931314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,4,power_law_1.01,1.1426560401916503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,4,power_law_1.01,1.2412223815917969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,4,power_law_1.01,1.1931520462036134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,4,balanced,1.4606720606486003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,4,power_law_1.01,1.210655975341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,4,power_law_1.01,1.1978560447692872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,4,balanced,0.8884533246358236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,4,power_law_1.01,1.2681856155395508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,4,balanced,3.3412373860677085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,4,power_law_1.01,1.3554431915283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,4,balanced,1.6286080678304036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,4,balanced,0.9845813115437826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,4,power_law_1.01,1.5261119842529296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,4,power_law_1.01,1.6290687561035155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,4,balanced,1.066111962000529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,4,power_law_1.01,2.0396223068237305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,4,power_law_1.01,1.7051519393920898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,4,balanced,1.3280373414357503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,4,power_law_1.01,0.13333760499954223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,4,power_law_1.01,1.9869632720947266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,4,power_law_1.01,0.20185599327087403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,4,balanced,2.28492800394694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,4,balanced,4.375626564025879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,4,power_law_1.01,2.2300416946411135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,4,balanced,1.4683574040730794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,4,power_law_1.01,0.1204416036605835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,4,power_law_1.01,2.817132759094238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,4,power_law_1.01,0.16631040573120118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,4,power_law_1.01,0.2791680097579956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,4,power_law_1.01,3.5210113525390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,4,power_law_1.01,0.4017471790313721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,4,balanced,2.2658027013142905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,4,power_law_1.01,4.733267211914063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,4,power_law_1.01,0.492633581161499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,4,power_law_1.01,0.5322175979614258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,4,power_law_1.01,5.923065567016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,4,balanced,2.9513867696126304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,4,power_law_1.01,0.5356863975524903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,4,power_law_1.01,0.15185920000076295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,4,power_law_1.01,7.136070251464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,4,balanced,2.600639979044596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,4,power_law_1.01,0.5662271976470947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,4,balanced,5.316405296325684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,4,power_law_1.01,0.2247231960296631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,4,power_law_1.01,0.5597631931304932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,4,power_law_1.01,11.575833892822265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,4,power_law_1.01,0.14065279960632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,4,power_law_1.01,0.20608000755310057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,4,power_law_1.01,0.595084810256958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,4,power_law_1.01,0.30382719039916994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,4,power_law_1.01,0.6152063846588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,4,power_law_1.01,20.858412170410155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,4,power_law_1.01,0.38417279720306396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,4,balanced,3.873141288757324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,4,power_law_1.01,0.6130623817443848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,4,power_law_1.01,0.5132991790771484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,4,power_law_1.01,0.6810304164886475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,4,power_law_1.01,0.564140796661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,4,power_law_1.01,0.6972544193267822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,4,balanced,3.590810775756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,4,power_law_1.01,0.5669760227203369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,4,power_law_1.01,0.768287992477417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,4,power_law_1.01,0.8933631896972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,4,power_law_1.01,0.5826623916625977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,4,power_law_1.01,0.8694656372070313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,4,power_law_1.01,0.6429312229156494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,4,power_law_1.01,1.092953586578369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,4,power_law_1.01,1.0311488151550292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,4,power_law_1.01,0.6374720096588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,4,balanced,5.19598929087321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,4,power_law_1.01,1.221132755279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,4,power_law_1.01,0.7010176181793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,4,power_law_1.01,1.4011327743530273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,4,balanced,8.321173350016275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,4,power_law_1.01,0.7524799823760986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,4,power_law_1.01,1.7715904235839843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,4,power_law_1.01,0.8078144073486329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,4,power_law_1.01,2.202329635620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,4,power_law_1.01,0.866585636138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,4,power_law_1.01,0.999289608001709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,4,power_law_1.01,2.991539192199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,4,power_law_1.01,3.6688961029052733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,4,power_law_1.01,4.826393508911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,4,power_law_1.01,1.0004863739013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,4,power_law_1.01,7.365843200683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,4,balanced,6.482880274454753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,4,balanced,5.625258763631185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.01,0.9899776458740235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,4,power_law_1.01,1.2310400009155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,4,power_law_1.01,13.533517456054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,4,power_law_1.2,0.22272639274597167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.01,1.3991359710693358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,4,power_law_1.01,1.6632320404052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,4,power_law_1.2,0.3457279920578003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.01,2.086150360107422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,4,power_law_1.2,0.18301440477371217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,4,power_law_1.01,2.8182655334472657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,4,power_law_1.2,0.2814719915390015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.01,3.593337631225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,4,power_law_1.2,0.4800704002380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,4,power_law_1.01,5.289683151245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,4,power_law_1.2,0.6432767868041992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.01,6.547385406494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,4,power_law_1.2,0.8959744453430176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,4,power_law_1.2,0.9942336082458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,4,power_law_1.01,8.177216339111329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,4,power_law_1.2,0.9931391716003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,4,power_law_1.2,1.0552191734313965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,4,balanced,10.604474385579428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,4,power_law_1.01,12.408223724365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,4,power_law_1.2,1.1166912078857423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,4,power_law_1.2,1.1943936347961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,4,power_law_1.2,1.2713983535766602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,4,power_law_1.2,1.225164794921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,4,power_law_1.01,27.310528564453126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,4,power_law_1.2,1.2742976188659667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,4,power_law_1.2,0.13337600231170654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,4,power_law_1.2,1.3646271705627442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,4,balanced,16.322677612304688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,4,power_law_1.2,1.4745087623596191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,4,power_law_1.2,0.19422719478607178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,4,power_law_1.2,1.6709632873535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,4,power_law_1.2,0.11216000318527222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,4,power_law_1.2,1.7610048294067382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,4,power_law_1.2,0.1720896005630493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,4,power_law_1.2,2.297446441650391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,4,power_law_1.2,1.9422975540161134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,4,power_law_1.2,0.24021759033203124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,4,power_law_1.2,2.172550392150879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,4,power_law_1.2,0.3246272087097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,4,power_law_1.2,2.4883455276489257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,4,power_law_1.2,0.4694784164428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,4,power_law_1.2,3.084351921081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,4,balanced,11.046277364095053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,4,power_law_1.2,0.5462912082672119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,4,power_law_1.2,3.5036865234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,4,power_law_1.2,5.11080322265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,4,power_law_1.2,0.5592512130737305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,4,power_law_1.2,0.5464191913604737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,4,power_law_1.2,6.686457824707031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,4,power_law_1.2,0.5816703796386719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,4,power_law_1.2,7.67484130859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,4,power_law_1.2,0.6315392017364502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,4,power_law_1.2,12.427776336669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,4,power_law_1.2,0.6260096073150635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,4,power_law_1.2,0.6526016235351563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,4,power_law_1.2,25.205593872070313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,4,power_law_1.2,0.703001594543457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,4,power_law_1.2,0.7337408065795898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,4,power_law_1.2,0.7853184223175049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,4,power_law_1.2,0.9453439712524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,4,balanced,21.46819814046224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,4,power_law_1.2,0.9640895843505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,4,power_law_1.2,1.176243209838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,4,power_law_1.2,1.0935935974121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,4,power_law_1.2,1.3298048019409179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,4,power_law_1.2,1.5228992462158204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,4,power_law_1.2,1.9989568710327148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,4,power_law_1.2,2.498259162902832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,4,power_law_1.2,3.428416061401367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,4,power_law_1.2,4.498585510253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,4,power_law_1.2,5.531039810180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,4,power_law_1.2,8.840402984619141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,4,power_law_1.2,16.472026062011718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,4,power_law_1.2,0.14320000410079955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,4,power_law_1.2,0.22447359561920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,4,power_law_1.2,0.11267199516296386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,4,power_law_1.2,0.1784000039100647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,4,power_law_1.2,0.2601664066314697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,4,power_law_1.2,0.36074879169464114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,4,power_law_1.2,0.4943552017211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,4,power_law_1.2,0.5365119934082031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,4,power_law_1.2,0.5535871982574463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,4,power_law_1.2,0.5823423862457275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,2,balanced,0.08742933471997578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,4,power_law_1.2,0.621337604522705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,2,balanced,0.12229866782824199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,4,power_law_1.2,0.6900224208831787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,2,balanced,0.2010506590207418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,4,power_law_1.2,0.6895999908447266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,2,balanced,0.36950933933258057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,2,balanced,0.6936053435007731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,4,power_law_1.2,0.7738880157470703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,2,balanced,1.344096024831136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,4,power_law_1.2,0.8264127731323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,2,balanced,1.345029354095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,4,power_law_1.2,0.922214412689209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,2,balanced,1.3391413688659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,4,power_law_1.2,0.9825407981872558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,2,balanced,1.3514506022135417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,2,balanced,1.346186637878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,2,balanced,1.3475359280904133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,4,power_law_1.2,1.0913344383239747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,2,balanced,1.3513813018798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,2,balanced,1.3583040237426758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,2,balanced,1.3755520184834797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.2,1.0204480171203614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,2,balanced,1.3812959988911946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,2,balanced,1.39301331837972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,4,power_law_1.2,1.3017087936401368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,2,balanced,1.4086400667826335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.2,1.5940159797668456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,4,power_law_1.2,1.8001983642578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,2,balanced,1.4803253809611003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.2,2.0458303451538087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,2,balanced,1.512880007425944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,4,power_law_1.2,3.2054080963134766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,2,balanced,1.5643733342488606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.2,3.7956417083740233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,2,balanced,1.6736960411071777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,4,power_law_1.2,5.701804733276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,2,balanced,0.06598400076230367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,2,balanced,0.0842186709245046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,2,balanced,1.8043626149495442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.2,7.563148498535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,2,balanced,0.12518399953842163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,2,balanced,0.21331733465194702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,2,balanced,0.37440534432729083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,4,power_law_1.2,10.104115295410157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,2,balanced,1.9090506235758464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,2,balanced,0.7099040349324545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,2,balanced,0.7105013529459635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,2,balanced,0.7090346813201904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,4,power_law_1.2,16.940179443359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,2,balanced,0.7188906669616699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,2,power_law_1.01,0.13211519718170167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,2,balanced,0.7231093247731527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,2,balanced,2.5158079465230307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,2,power_law_1.01,0.19886720180511475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,2,balanced,0.7248906294504801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,2,balanced,0.09089066584904988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,2,balanced,0.7352960109710693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,2,power_law_1.01,0.16427520513534546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,4,power_law_1.2,29.229241943359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,2,balanced,0.10453866918881734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,2,balanced,0.7441386381785074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,2,power_law_1.01,0.3066751956939697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,2,balanced,0.14867200454076132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,2,balanced,0.7495253086090088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,2,balanced,0.23641600211461386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,2,power_law_1.01,0.4714943885803223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,2,balanced,2.7066561381022134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,2,balanced,0.7665386994679769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,2,balanced,0.3917493422826131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,2,balanced,0.7708586851755778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,2,power_law_1.01,0.6317759990692139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,2,balanced,0.7866026560465494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,2,balanced,0.7141173680623373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,2,power_law_1.01,0.08703359961509705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,2,power_law_1.01,0.9408512115478516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,2,balanced,0.8156747023264567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,2,balanced,0.7188586393992106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,2,power_law_1.01,0.12218879461288452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,2,power_law_1.01,1.001747226715088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,2,balanced,0.8724479675292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,2,balanced,0.7239147027333578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,2,power_law_1.01,0.10840959548950195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,2,balanced,0.7279733022054037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,2,balanced,0.9355146884918213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,2,power_law_1.01,1.041593647003174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,2,balanced,3.76093324025472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,2,power_law_1.01,0.18023040294647216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,2,balanced,0.7299946943918864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,2,power_law_1.01,1.0761088371276855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,2,balanced,0.994757334391276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,2,power_law_1.01,0.27306880950927737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,2,balanced,0.7400853633880615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,2,power_law_1.01,1.074880027770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,2,power_law_1.01,0.35710721015930175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,2,balanced,0.7500320275624593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,2,balanced,1.129578669865926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,2,power_law_1.01,1.1354687690734864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,2,balanced,0.757263978322347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,2,power_law_1.01,0.5013887882232666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,2,power_law_1.01,1.1403776168823243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,2,balanced,0.7738933563232422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,2,power_law_1.01,0.5154751777648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,2,balanced,1.2598346869150798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,2,power_law_1.01,1.1848575592041015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,2,balanced,0.7936106522878011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,2,power_law_1.01,0.5504640102386474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,2,power_law_1.01,1.223519992828369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,2,balanced,4.975290616353353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,2,balanced,0.8093492984771729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,2,power_law_1.01,0.5665408134460449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,2,power_law_1.01,0.11623680591583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,2,power_law_1.01,1.2579968452453614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,2,balanced,1.714255968729655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,2,balanced,0.8440907001495361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,2,power_law_1.01,0.5878592014312745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,2,power_law_1.01,0.15404160022735597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,2,power_law_1.01,1.3614591598510741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,2,power_law_1.01,0.1355072021484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,2,power_law_1.01,0.5986495971679687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,2,power_law_1.01,0.19509119987487794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,2,power_law_1.01,1.4954367637634278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,2,power_law_1.01,0.6636415958404541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,2,power_law_1.01,0.2888063907623291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,2,power_law_1.01,0.6324480056762696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,2,power_law_1.01,1.5754176139831544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,2,power_law_1.01,0.36862080097198485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,2,balanced,1.9468800226847331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,2,power_law_1.01,0.6693247795104981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,2,power_law_1.01,0.5115456104278564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,2,balanced,0.9508586724599203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,2,power_law_1.01,1.888844871520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,2,power_law_1.01,0.5704063892364502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,2,power_law_1.01,0.6857088088989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,2,power_law_1.01,1.805120086669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,2,power_law_1.01,0.5871039867401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,2,power_law_1.01,0.7455359935760498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,2,power_law_1.01,0.5751488208770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,2,power_law_1.01,2.150412750244141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,2,balanced,6.601509094238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,2,power_law_1.01,0.8502400398254395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,2,power_law_1.01,0.6313983917236328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,2,power_law_1.01,0.6593664169311524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,2,power_law_1.01,0.8579584121704101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,2,power_law_1.01,2.2809215545654298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,2,power_law_1.01,0.6950655937194824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,2,balanced,2.774479866027832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,2,power_law_1.01,1.0579263687133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,2,power_law_1.01,2.95731201171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,2,power_law_1.2,0.12117760181427002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,2,power_law_1.01,0.7714047908782959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,2,power_law_1.01,1.0364543914794921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,2,power_law_1.01,0.813753604888916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,2,power_law_1.01,3.5973758697509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,2,power_law_1.2,0.200927996635437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,2,balanced,1.0502399603525798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,2,power_law_1.01,1.2659071922302245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,2,power_law_1.01,0.8968511581420898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,2,power_law_1.2,0.16369279623031616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,2,power_law_1.01,4.849292755126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,2,power_law_1.01,1.027660846710205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,2,power_law_1.01,1.5200511932373046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,2,balanced,1.2035626570383708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,2,power_law_1.2,0.26477439403533937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,2,power_law_1.01,1.9792512893676757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,2,power_law_1.01,6.325856018066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,2,power_law_1.2,0.4136320114135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,2,balanced,1.3086293538411458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,2,power_law_1.01,1.1360447883605957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,2,power_law_1.01,2.405740737915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,2,power_law_1.01,7.44769287109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,2,power_law_1.2,0.5784063816070557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,2,balanced,3.6231520970662436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,2,power_law_1.01,3.239104080200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,2,balanced,1.733290672302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,2,power_law_1.2,0.8955776214599609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,2,power_law_1.01,1.1146944046020508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,2,power_law_1.01,4.195872116088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,2,power_law_1.01,11.518470764160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,2,power_law_1.2,0.9718463897705079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,2,power_law_1.01,1.4066431999206543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,2,power_law_1.01,4.9858238220214846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,2,power_law_1.2,1.0069567680358886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,2,power_law_1.01,1.6966079711914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,2,balanced,2.003328005472819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,2,balanced,10.178415934244791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,2,power_law_1.01,2.1172416687011717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,2,power_law_1.2,1.0291135787963868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,2,power_law_1.01,20.980230712890624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,2,power_law_1.01,7.8283134460449215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,2,power_law_1.01,2.514022445678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,2,power_law_1.2,1.0912575721740723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,2,power_law_1.01,3.528460693359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,2,balanced,3.1308959325154624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,2,power_law_1.2,1.1363136291503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,2,power_law_1.01,4.54692497253418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,2,power_law_1.01,15.071282958984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,2,power_law_1.2,1.1810751914978028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,2,balanced,4.419882774353027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,2,power_law_1.01,6.426585388183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,2,power_law_1.2,1.240499210357666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,2,power_law_1.01,8.151264190673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,2,power_law_1.2,1.2736895561218262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,2,balanced,3.706080118815104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,2,power_law_1.01,9.928627014160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,2,power_law_1.2,1.2825407981872559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,2,power_law_1.2,1.4285120010375976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,2,power_law_1.01,15.485491943359374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,2,power_law_1.2,1.5213184356689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,2,power_law_1.2,1.696486473083496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,2,power_law_1.01,32.44151611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,2,balanced,5.464197158813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,2,power_law_1.2,2.0309120178222657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,2,power_law_1.2,1.8924928665161134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,2,power_law_1.2,2.223334312438965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,2,power_law_1.2,2.5096384048461915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,2,balanced,7.201487859090169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,2,power_law_1.2,3.226425552368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,2,power_law_1.2,3.8148094177246095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,2,balanced,7.339141209920247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,2,power_law_1.2,5.068044662475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,2,power_law_1.2,6.649517059326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,2,power_law_1.2,7.993516540527343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,2,balanced,19.102731068929035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,2,power_law_1.2,12.964813232421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,2,power_law_1.2,23.370343017578126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,2,balanced,9.129653294881185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,2,power_law_1.2,0.08737279772758484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,2,power_law_1.2,0.12079999446868897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,2,power_law_1.2,0.10784000158309937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,2,balanced,14.287551879882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,2,power_law_1.2,0.17624319791793824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,2,balanced,14.90729014078776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,2,power_law_1.2,0.24110078811645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,2,power_law_1.2,0.31734399795532225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,2,power_law_1.2,0.47358717918396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,2,power_law_1.2,0.4879615783691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,2,power_law_1.2,0.5412032127380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,2,power_law_1.2,0.5796607971191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,2,power_law_1.2,0.6093056201934814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,2,power_law_1.2,0.604582405090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,2,power_law_1.2,0.653439998626709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,2,power_law_1.2,0.6604928016662598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,2,power_law_1.2,0.7035711765289306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,2,power_law_1.2,0.732096004486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,2,power_law_1.2,0.769536018371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,2,power_law_1.2,0.9191807746887207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,2,power_law_1.2,0.897760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,2,power_law_1.2,1.070751953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,2,power_law_1.2,1.0963583946228028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,2,power_law_1.2,1.3172287940979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,2,power_law_1.2,1.6197824478149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,2,power_law_1.2,2.1092607498168947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,2,power_law_1.2,2.4524288177490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,2,power_law_1.2,3.523321533203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,2,balanced,29.950174967447918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,2,power_law_1.2,4.433433532714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,2,power_law_1.2,5.120377731323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,2,power_law_1.2,8.533273315429687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,2,power_law_1.2,17.037298583984374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,2,power_law_1.2,0.1130944013595581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,2,power_law_1.2,0.1494976043701172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,1,balanced,0.08925333619117737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,2,power_law_1.2,0.12211840152740479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,1,balanced,0.12469333410263062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,2,power_law_1.2,0.18373119831085205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,1,balanced,0.204202671845754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,2,power_law_1.2,0.25109760761260985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,1,balanced,0.37878934542338055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,2,power_law_1.2,0.3377919912338257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,1,balanced,0.694922685623169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,2,power_law_1.2,0.5226111888885498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,1,balanced,1.3538773854573567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,1,balanced,1.3604906400044758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,2,power_law_1.2,0.5403840065002441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,1,balanced,1.3577173550923665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,1,balanced,0.06856533388296764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,2,power_law_1.2,0.5745728015899658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,1,balanced,1.372586727142334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,1,balanced,0.08876799543698628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,2,power_law_1.2,0.5956799983978271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,1,balanced,1.3627893129984539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,1,balanced,0.13184533516565958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,2,power_law_1.2,0.630783987045288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,1,balanced,1.3824960390726726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,1,balanced,0.2241599957148234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,2,power_law_1.2,0.6547135829925537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,1,balanced,1.3920693397521973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,1,balanced,0.39743999640146893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,2,power_law_1.2,0.7104832172393799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,1,balanced,1.4148532549540203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,1,balanced,0.7201653321584066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,2,power_law_1.2,0.7699135780334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,1,balanced,0.72707732518514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,1,balanced,1.4032266934712727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,2,power_law_1.2,0.8463168144226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,1,balanced,0.7324906984965006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,1,balanced,1.415455977121989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,2,power_law_1.2,0.9214400291442871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,1,balanced,0.7396319707234701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,1,balanced,1.4259947141011555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,2,power_law_1.2,1.0447168350219727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,1,balanced,0.7479946613311768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,1,balanced,1.4390239715576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,1,balanced,0.7498186429341634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,1,balanced,0.7608160177866617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,1,balanced,1.5378185907999675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,2,power_law_1.2,1.1632703781127929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,1,balanced,0.7667679786682129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,1,balanced,1.6152532895406086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,1,balanced,0.7835520108540853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,2,power_law_1.2,1.187443161010742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,1,balanced,0.8033813635508219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,1,balanced,1.703279972076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,2,power_law_1.2,1.484761619567871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,1,power_law_1.01,0.08833919763565064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,1,balanced,0.8219199975331625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,1,balanced,1.813360055287679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,2,power_law_1.2,1.7209856033325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,1,balanced,0.8601280053456625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,1,power_law_1.01,0.12377599477767945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,2,power_law_1.2,2.072102355957031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,1,power_law_1.01,0.14415359497070312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,1,balanced,0.896405299504598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,1,balanced,2.029909292856852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,1,power_law_1.01,0.27921280860900877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,2,power_law_1.2,2.5557376861572267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,1,balanced,0.13195199767748514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,1,balanced,0.9679733117421468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,1,power_law_1.01,0.44097280502319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,1,balanced,0.14415466785430908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,2,power_law_1.2,3.497439956665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,1,balanced,1.0676906903584797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,1,balanced,2.271968046824137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,1,power_law_1.01,0.6322432041168213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,1,balanced,0.18874132633209229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,2,power_law_1.2,4.6478527069091795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,1,balanced,0.28153600295384723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,1,power_law_1.01,0.9545280456542968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,1,balanced,1.1924800078074138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,1,balanced,0.43908798694610596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,2,power_law_1.2,6.749676513671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,1,power_law_1.01,1.0009023666381835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,1,balanced,0.7941653728485107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,1,balanced,2.989797274271647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,1,power_law_1.01,1.019315242767334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,1,balanced,1.3929972648620605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,2,power_law_1.2,8.75702362060547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,1,balanced,0.8032480080922445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,1,power_law_1.01,0.06702079772949218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,1,power_law_1.01,1.0798463821411133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,1,balanced,0.8110026518503824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,1,power_law_1.01,0.08572160005569458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,2,power_law_1.2,10.930201721191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,1,power_law_1.01,0.09718400239944458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,1,power_law_1.01,1.1093695640563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,1,balanced,0.8181493282318115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,1,balanced,1.617850621541341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,1,power_law_1.01,0.18035839796066283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,1,balanced,3.4162826538085938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,1,balanced,0.8244000275929769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,1,power_law_1.01,1.153536033630371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,1,power_law_1.01,0.2640255928039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,2,power_law_1.2,17.7661376953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,1,balanced,0.8392053445180258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,1,power_law_1.01,0.34828801155090333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,1,power_law_1.01,1.16810884475708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,1,power_law_1.01,0.49458560943603513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,1,balanced,0.8537066777547201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,1,balanced,2.2095840771993003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,1,power_law_1.01,1.2188287734985352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,1,power_law_1.01,0.5405439853668212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,1,balanced,0.8690346876780192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,1,power_law_1.01,0.5577919960021973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,1,power_law_1.01,1.242246437072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,2,power_law_1.2,34.43110961914063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,1,balanced,0.9013866583506266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,1,power_law_1.01,0.5823999881744385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,1,power_law_1.01,1.265875244140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,1,power_law_1.01,0.6220287799835205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,1,balanced,0.9436373710632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,1,balanced,4.768666585286458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,1,power_law_1.01,0.6650559902191162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,1,power_law_1.01,1.3695360183715821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,1,balanced,0.9796586831410726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,1,balanced,2.6742614110310874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,1,power_law_1.01,0.6877056121826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,1,power_law_1.01,1.5344511985778808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,1,power_law_1.01,0.717523193359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,1,balanced,1.0426452954610188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,1,power_law_1.01,0.7671999931335449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,1,power_law_1.01,1.62030086517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,1,power_law_1.01,0.8104767799377441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,1,power_law_1.01,0.8499199867248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,1,power_law_1.01,1.917344093322754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,1,power_law_1.01,0.9431936264038085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,1,power_law_1.01,1.864486312866211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,1,power_law_1.01,0.9947775840759278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,1,balanced,1.1994346777598064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,1,balanced,3.8121493657430015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,1,balanced,6.274527867635091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,1,power_law_1.01,1.1601152420043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,1,power_law_1.01,2.1930431365966796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,1,power_law_1.01,1.2331392288208007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,1,power_law_1.01,2.537171173095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,1,power_law_1.01,1.5086079597473145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,1,power_law_1.01,3.2248321533203126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,1,power_law_1.01,1.766489601135254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,1,power_law_1.01,3.9510337829589846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,1,power_law_1.01,2.351807975769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,1,power_law_1.01,2.9366527557373048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,1,power_law_1.01,5.460403060913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,1,balanced,1.4106720288594563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,1,power_law_1.01,4.09117431640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,1,power_law_1.01,6.954093170166016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,1,balanced,4.924026807149251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,1,balanced,1.7070719401041667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,1,power_law_1.01,5.144153594970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,1,power_law_1.01,6.3040000915527346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,1,power_law_1.01,8.480934143066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,1,balanced,7.6187788645426435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,1,balanced,1.8908586502075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,1,power_law_1.01,9.807955169677735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,1,power_law_1.01,13.753018188476563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,1,balanced,2.6110453605651855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,1,power_law_1.01,20.618316650390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,1,power_law_1.01,26.33417663574219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,1,balanced,3.061552047729492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,1,balanced,6.349370956420898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,1,balanced,4.755903879801433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,1,power_law_1.01,0.12210559844970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,1,power_law_1.01,0.14494719505310058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,1,power_law_1.01,0.15412479639053345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,1,balanced,5.784933090209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,1,power_law_1.01,0.23080320358276368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,1,power_law_1.2,0.08797439932823181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,1,balanced,12.44480005900065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,1,power_law_1.01,0.3247488021850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,1,power_law_1.2,0.12023680210113526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,1,power_law_1.2,0.1512511968612671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,1,power_law_1.01,0.414188814163208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,1,power_law_1.01,0.5732607841491699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,1,power_law_1.2,0.2710975885391235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,1,power_law_1.2,0.4133120059967041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,1,power_law_1.01,0.6172480106353759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,1,balanced,8.604069391886393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,1,power_law_1.2,0.5219136238098144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,1,power_law_1.01,0.6310719966888427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,1,balanced,9.558746973673502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,1,power_law_1.2,0.8873984336853027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,1,power_law_1.01,0.6514368057250977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,1,power_law_1.01,0.6949440002441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,1,power_law_1.2,0.9700480461120605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,1,power_law_1.01,0.740934419631958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,1,power_law_1.2,0.9954943656921387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,1,power_law_1.2,1.0376832008361816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,1,power_law_1.01,0.7803008079528808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,1,power_law_1.2,1.0804863929748536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,1,power_law_1.01,0.8567359924316407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,1,balanced,11.414037068684896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,1,power_law_1.2,1.1694144248962401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,1,power_law_1.01,0.9496000289916993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,1,power_law_1.2,1.1951423645019532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,1,power_law_1.01,1.0201024055480956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,1,power_law_1.2,1.2208703994750976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,1,power_law_1.01,1.1793279647827148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,1,power_law_1.2,1.297036838531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,1,power_law_1.2,1.36746244430542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,1,power_law_1.01,1.3154239654541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,1,power_law_1.2,1.4521599769592286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,1,power_law_1.2,1.6288639068603517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,1,balanced,14.241994222005209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,1,power_law_1.2,1.713587188720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.01,1.4163647651672364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,1,power_law_1.2,2.0122304916381837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.01,1.7879167556762696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.01,2.1670400619506838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,1,power_law_1.2,1.9007104873657226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,1,balanced,25.218058268229168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.01,2.7716415405273436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,1,power_law_1.2,2.267500877380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.01,3.445964813232422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,1,power_law_1.2,2.6532415390014648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.01,4.82147216796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,1,power_law_1.2,3.377132797241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.01,6.1906688690185545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,1,power_law_1.2,4.111449432373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.01,8.931922912597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,1,balanced,18.825733184814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,1,power_law_1.2,5.662847900390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.01,11.70447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,1,balanced,23.08447519938151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,1,power_law_1.2,7.132109069824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,1,power_law_1.2,8.651526641845702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,1,power_law_1.01,14.447135925292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,1,power_law_1.2,14.113235473632812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,1,power_law_1.01,22.80518341064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,1,power_law_1.2,26.375796508789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,1,power_law_1.01,45.307681274414065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,1,power_law_1.2,0.06689919829368592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,1,power_law_1.2,0.08602880239486695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,1,power_law_1.2,0.10094720125198364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,1,power_law_1.2,0.15783679485321045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,1,power_law_1.2,0.23297278881072997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,1,power_law_1.2,0.31058559417724607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,1,power_law_1.2,0.4791168212890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,1,power_law_1.2,0.5192128181457519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,1,power_law_1.2,0.5686079978942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,1,power_law_1.2,0.5770624160766602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,1,power_law_1.2,0.6068480014801025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,1,power_law_1.2,0.6669312000274659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,1,power_law_1.2,0.6795008182525635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,1,power_law_1.2,0.7181951999664307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,1,power_law_1.2,0.7595071792602539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,1,balanced,46.80699666341146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,1,power_law_1.2,0.8135616302490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,1,power_law_1.2,0.8584832191467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,1,power_law_1.2,0.9974528312683105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,1,power_law_1.2,1.0221247673034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,4,balanced,0.03014933317899704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,1,power_law_1.2,1.202560043334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,4,balanced,0.03209066639343897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,1,power_law_1.2,0.12360320091247559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,1,power_law_1.2,1.290611171722412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,4,balanced,0.04298666616280874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,1,power_law_1.2,1.5575296401977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,1,power_law_1.2,0.14317439794540404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,4,balanced,0.0624533345301946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,1,power_law_1.2,1.842438316345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,1,power_law_1.2,0.1530943989753723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,4,balanced,0.0988159974416097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,4,balanced,0.09955199559529622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,1,power_law_1.2,0.22254719734191894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,1,power_law_1.2,2.4223424911499025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,4,balanced,0.09876267115275066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,1,power_law_1.2,0.275929594039917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,1,power_law_1.2,2.9712383270263674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,4,balanced,0.09995733698209126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,1,power_law_1.2,0.37794559001922606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,1,power_law_1.2,4.121068954467773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,4,balanced,0.10059199730555217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,1,power_law_1.2,0.5651072025299072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,4,balanced,0.10038933157920837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,1,power_law_1.2,5.483801651000976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,1,power_law_1.2,0.6032639980316162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,4,balanced,0.10142933328946431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,1,power_law_1.2,0.6238399982452393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,4,balanced,0.10317867000897725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,1,power_law_1.2,6.698880004882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,1,power_law_1.2,0.6579904079437255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,4,balanced,0.10315199693044026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,1,power_law_1.2,0.6941184043884278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,4,balanced,0.10578133662541707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,1,power_law_1.2,10.356575775146485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,4,balanced,0.11460266510645549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,1,power_law_1.2,0.7495423793792725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,4,balanced,0.11706133683522542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,1,power_law_1.2,0.7949888229370117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,1,power_law_1.2,20.60425567626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,4,balanced,0.11972799897193909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,1,power_law_1.2,0.8756223678588867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,4,balanced,0.12681066989898682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,1,power_law_1.2,0.972544002532959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,1,power_law_1.2,1.0456512451171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,4,balanced,0.13479999701182047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,1,power_law_1.2,1.193446445465088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,4,balanced,0.14525333046913147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,4,balanced,0.16803733507792154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,1,power_law_1.2,1.3766783714294433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,4,balanced,0.19622933864593506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.2,1.4604479789733886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,4,balanced,0.21361599365870157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.2,1.825119972229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.2,2.2167743682861327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,4,balanced,0.03253866732120514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.2,2.8439807891845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,4,balanced,0.3004586696624756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,4,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.2,3.5298622131347654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,4,balanced,0.034128000338872276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,4,balanced,0.05202133456865946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.2,4.870598220825196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,4,balanced,0.07297599812348683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,4,balanced,0.07157333195209503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.2,6.251513671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,4,balanced,0.07241066793600719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,4,balanced,0.36770133177439374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,4,balanced,0.07188266515731812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.2,8.978713226318359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,4,balanced,0.07204799850781758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,4,balanced,0.07349333167076111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,4,balanced,0.07461333274841309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.2,11.724332427978515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,4,balanced,0.0761706680059433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,4,balanced,0.07619200150171916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,4,balanced,0.07795733213424683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,1,power_law_1.2,14.463475036621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,4,balanced,0.08359466989835103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,4,balanced,0.5321280161539713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,4,balanced,0.08406399687131245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,4,balanced,0.09033067027727763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,1,power_law_1.2,22.72569580078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,4,balanced,0.09804266691207886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,4,balanced,0.10772266983985901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,4,balanced,0.12084800004959106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,4,balanced,0.03107200066248576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,4,power_law_1.01,0.0442111998796463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,1,power_law_1.2,44.96400756835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,4,balanced,0.032442666590213776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,4,balanced,0.13471999764442444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,4,power_law_1.01,0.03961600065231323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,4,balanced,0.6959893703460693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,4,balanced,0.0345920001467069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,4,power_law_1.01,0.039654400944709775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,4,balanced,0.048021331429481506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,4,balanced,0.18743467330932617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,4,power_law_1.01,0.05554559826850891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,4,balanced,0.06710933148860931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,4,power_law_1.01,0.061312001943588254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,4,balanced,0.206112007300059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,4,balanced,0.06840533514817555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,4,power_law_1.01,0.08840320110321045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,4,balanced,0.06860266625881195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,4,power_law_1.01,0.09175040125846863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,4,power_law_1.01,0.036524799466133115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,4,balanced,0.06937600175539653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,4,balanced,0.2956213355064392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,4,power_law_1.01,0.09591040015220642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,4,balanced,0.07016000151634216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,4,power_law_1.01,0.03252480030059814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,4,power_law_1.01,0.09658880233764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,4,balanced,0.07169066866238911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,4,power_law_1.01,0.035795199871063235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,4,balanced,0.859824021657308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,4,power_law_1.01,0.10302079916000366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,4,balanced,0.0721973329782486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,4,power_law_1.01,0.04581120014190674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,4,balanced,0.37380798657735187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,4,balanced,0.07375466823577881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,4,power_law_1.01,0.10090240240097045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,4,power_law_1.01,0.05255039930343628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,4,power_law_1.01,0.0670144021511078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,4,balanced,0.07483733197053273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,4,power_law_1.01,0.10609920024871826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,4,power_law_1.01,0.06775040030479432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,4,power_law_1.01,0.10927360057830811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,4,balanced,0.07779733339945476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,4,power_law_1.01,0.06922879815101624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,4,power_law_1.01,0.1117311954498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,4,power_law_1.01,0.07023360133171082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,4,power_law_1.01,0.12113920450210572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,4,power_law_1.01,0.07178879976272583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,4,balanced,0.5443786780039469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,4,power_law_1.01,0.1257472038269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,4,power_law_1.01,0.07408000230789184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,4,balanced,0.0862666666507721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,4,power_law_1.01,0.1300927996635437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,4,power_law_1.01,0.07816320061683654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,4,balanced,0.08721599976221721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,4,power_law_1.01,0.08106240034103393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,4,power_law_1.01,0.14343039989471434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,4,power_law_1.01,0.08213120102882385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,4,power_law_1.01,0.16049280166625976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,4,power_law_1.01,0.08759040236473084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,4,power_law_1.01,0.17815040349960326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,4,power_law_1.01,0.03377920091152191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,4,power_law_1.01,0.09545599818229675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,4,power_law_1.01,0.21736960411071776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,4,balanced,0.7138826847076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,4,balanced,1.3399680455525715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,4,power_law_1.01,0.03454079926013946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,4,power_law_1.01,0.10117759704589843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,4,power_law_1.01,0.2678976058959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,4,balanced,0.09769599636395772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,4,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,4,power_law_1.01,0.11451519727706909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,4,power_law_1.01,0.3118016004562378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,4,power_law_1.01,0.045388799905776975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,4,power_law_1.01,0.12476799488067628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,4,balanced,0.11190932989120483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,4,power_law_1.01,0.3864959955215454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,4,power_law_1.01,0.05306239724159241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,4,power_law_1.01,0.15425920486450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,4,power_law_1.01,0.5074495792388916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,4,balanced,0.11704533298810323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,4,power_law_1.01,0.06446719765663148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,4,power_law_1.01,0.17484159469604493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,4,power_law_1.01,0.7433216094970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,4,power_law_1.01,0.06577919721603394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,4,balanced,0.15350932876269022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,4,power_law_1.01,0.24053120613098145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,4,power_law_1.01,0.9318464279174805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,4,power_law_1.01,0.06825600266456604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,4,power_law_1.01,0.2869375944137573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,4,balanced,0.1713386575380961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,4,power_law_1.01,0.07293440103530884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,4,balanced,0.8845280011494955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,4,power_law_1.01,0.3985088109970093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,4,power_law_1.01,1.0924223899841308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,4,power_law_1.01,0.07324159741401673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,4,power_law_1.01,0.48757119178771974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,4,balanced,0.2513333360354106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,4,power_law_1.01,1.726585578918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,4,power_law_1.01,0.07948799729347229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,4,power_law_1.01,0.08344320058822632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,4,power_law_1.01,0.7914432048797607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,4,power_law_1.01,3.1350528717041017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,4,power_law_1.01,0.08502399921417236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,4,power_law_1.01,0.8913984298706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,4,balanced,0.31003199021021527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,4,power_law_1.01,0.09129599928855896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,4,power_law_1.01,1.023686408996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,4,power_law_1.01,1.7793344497680663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,4,balanced,0.45347734292348224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,4,power_law_1.01,0.09820799827575684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,4,power_law_1.01,3.575328063964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,4,power_law_1.01,0.10552959442138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,4,power_law_1.01,0.10973440408706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,4,balanced,0.5917919874191284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,4,power_law_1.2,0.04419200122356415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,4,power_law_1.01,0.13368959426879884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,4,power_law_1.2,0.03373439908027649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,4,balanced,1.3627360661824544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,4,power_law_1.01,0.14458240270614625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,4,power_law_1.2,0.039961600303649904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,4,power_law_1.01,0.2002880096435547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,4,power_law_1.2,0.051283198595047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,4,power_law_1.2,0.05927680134773254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,4,power_law_1.01,0.24114561080932617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,4,balanced,0.868506669998169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,4,power_law_1.2,0.08955519795417785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,4,power_law_1.01,0.3561728000640869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,4,balanced,2.5958239237467446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,4,power_law_1.2,0.09281280040740966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,4,power_law_1.01,0.48299517631530764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,4,power_law_1.2,0.09623680114746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,4,power_law_1.01,0.5838399887084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,4,power_law_1.2,0.09896320104598999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,4,power_law_1.01,0.7611775875091553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,4,power_law_1.2,0.10007679462432861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,4,power_law_1.2,0.10217599868774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,4,power_law_1.01,1.1845503807067872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,4,power_law_1.2,0.1100160002708435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,4,balanced,1.1419359842936199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,4,power_law_1.01,1.5374272346496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,4,power_law_1.2,0.10892800092697144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,4,power_law_1.01,1.9435455322265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,4,power_law_1.2,0.1180351972579956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,4,power_law_1.2,0.12399359941482543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,4,power_law_1.01,3.06298885345459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,4,power_law_1.2,0.12995840311050416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,4,power_law_1.01,6.513855743408203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,4,power_law_1.2,0.13197439908981323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,4,power_law_1.2,0.1462656021118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,4,power_law_1.2,0.1678272008895874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,4,balanced,1.4104906717936199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,4,power_law_1.2,0.19136639833450317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,4,power_law_1.2,0.2439039945602417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,4,power_law_1.2,0.29561600685119627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,4,power_law_1.2,0.30857601165771487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,4,power_law_1.2,0.4284351825714111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,4,balanced,2.6374826431274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,4,power_law_1.2,0.6143807888031005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,4,power_law_1.2,0.8119808197021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,4,power_law_1.2,0.9944512367248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,4,power_law_1.2,1.2717568397521972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,4,power_law_1.2,2.205766487121582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,4,balanced,2.2291785875956216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,4,power_law_1.2,4.833369445800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,4,power_law_1.2,0.03607679903507233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,4,power_law_1.2,0.03167999982833862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,4,power_law_1.2,0.0350271999835968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,4,power_law_1.2,0.043059200048446655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,4,power_law_1.2,0.05100160241127014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,4,power_law_1.2,0.06614400148391723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,4,power_law_1.2,0.06895999908447266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,4,power_law_1.2,0.06889600157737732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,4,power_law_1.2,0.07037439942359924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,4,power_law_1.2,0.07194240093231201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,4,power_law_1.2,0.07783039808273315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,4,power_law_1.2,0.08156160116195679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,4,power_law_1.2,0.08181120157241821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,4,power_law_1.2,0.08392320275306701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,4,power_law_1.2,0.09200000166893005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,4,power_law_1.2,0.09690880179405212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,4,power_law_1.2,0.09983360171318054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,4,power_law_1.2,0.11938560009002686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,4,power_law_1.2,0.12567039728164672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,4,power_law_1.2,0.15384960174560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,4,balanced,4.409632047017415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,4,power_law_1.2,0.19035520553588867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,4,power_law_1.2,0.25594239234924315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,4,power_law_1.2,0.29424641132354734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,4,power_law_1.2,0.45418882369995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,4,power_law_1.2,0.5328767776489258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,4,power_law_1.2,0.8091391563415528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,4,power_law_1.2,1.135155200958252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,4,power_law_1.2,1.537504005432129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,4,power_law_1.2,2.16232967376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,4,power_law_1.2,4.651283264160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,2,balanced,0.02717866748571396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,2,balanced,0.032074667513370514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,2,balanced,0.04366933306058248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,2,balanced,0.06320533156394958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,2,balanced,0.10168000062306722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,4,power_law_1.2,0.03330560028553009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,2,balanced,0.10107733805974324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,4,power_law_1.2,0.03442560136318207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,2,balanced,0.10101333260536194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,4,power_law_1.2,0.0353408008813858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,2,balanced,0.1002293328444163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,4,power_law_1.2,0.043833601474761966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,2,balanced,0.10168533523877461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,4,power_law_1.2,0.05065600275993347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,2,balanced,0.10258666674296062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,4,power_law_1.2,0.06639360189437866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,2,balanced,0.10381333033243816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,4,power_law_1.2,0.06791679859161377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,2,balanced,0.10592533151308696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,4,power_law_1.2,0.07109760046005249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,2,balanced,0.03352533280849457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,2,balanced,0.10674132903416951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,4,power_law_1.2,0.07246720194816589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,2,balanced,0.1090826690196991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,2,balanced,0.03294933338960012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,4,power_law_1.2,0.07427840232849121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,2,balanced,0.11966933806737264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,2,balanced,0.036117332677046456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,4,power_law_1.2,0.07815679907798767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,2,balanced,0.12211733063062032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,2,balanced,0.05411200225353241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,4,power_law_1.2,0.08343039751052857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,2,balanced,0.1297813355922699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,2,balanced,0.07452266911665599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,4,power_law_1.2,0.08533120155334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,2,balanced,0.07633600135644276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,2,balanced,0.1397813359896342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,4,power_law_1.2,0.09502080082893372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,2,balanced,0.07738666733105977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,2,balanced,0.15095466375350952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,2,balanced,0.07593599955240886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,2,balanced,0.07766399780909221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,2,balanced,0.16966400543848673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,4,power_law_1.2,0.10383360385894776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,2,balanced,0.0782293329636256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,4,power_law_1.2,0.10829440355300904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,2,balanced,0.18629332383473715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,2,balanced,0.07903466622034709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,2,balanced,0.08158400158087413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,4,power_law_1.2,0.1161471962928772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,2,balanced,0.24660799900690714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,2,balanced,0.041306667029857635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,2,balanced,0.0823413332303365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,4,power_law_1.2,0.12716799974441528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,2,balanced,0.08547199765841167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,2,balanced,0.0421066681543986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,2,power_law_1.01,0.030534398555755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,4,power_law_1.2,0.15754239559173583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,2,balanced,0.09238933523495992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,2,balanced,0.04516266783078512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,2,balanced,0.2752959926923116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,2,power_law_1.01,0.034297600388526917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,4,power_law_1.2,0.1970944046974182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,2,balanced,0.09366933504740398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,2,balanced,0.057536001006762184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,2,power_law_1.01,0.038975998759269714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,4,power_law_1.2,0.23306879997253419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,2,power_law_1.01,0.05125759840011597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,2,balanced,0.0783679982026418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,2,balanced,0.10268266995747884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,2,power_law_1.01,0.06039040088653565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,4,power_law_1.2,0.40073599815368655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,2,balanced,0.39585598309834796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,2,balanced,0.08069866895675659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,2,power_law_1.01,0.09214079976081849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,2,balanced,0.11692800124486287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,4,power_law_1.2,0.4811135768890381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,2,power_law_1.01,0.09416319727897644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,2,balanced,0.08140266438325246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,2,power_law_1.01,0.0939903974533081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,2,balanced,0.12743999560674033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,2,balanced,0.0822026679913203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,4,power_law_1.2,0.7101247787475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,2,power_law_1.01,0.09895039796829223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,2,power_law_1.01,0.1023360013961792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,2,balanced,0.08378666639328003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,2,balanced,0.15043733517328897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,4,power_law_1.2,0.8855232238769531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,2,power_law_1.01,0.10559359788894654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,2,balanced,0.4984746774037679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,2,power_law_1.01,0.034720000624656674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,2,balanced,0.08603200316429138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,2,power_law_1.01,0.11036159992218017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,4,power_law_1.2,1.2205183982849122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,2,balanced,0.17023466030756632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,2,power_law_1.01,0.11336959600448608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,2,balanced,0.088319996992747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,2,power_law_1.01,0.03307519853115082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,2,power_law_1.01,0.11910400390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,4,power_law_1.2,1.8004928588867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,2,balanced,0.09083732962608337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,2,power_law_1.01,0.12380800247192383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,2,power_law_1.01,0.03697279989719391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,2,power_law_1.01,0.13232640027999878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,2,balanced,0.2385866641998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,4,power_law_1.2,2.354105567932129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,2,balanced,0.09352533022562663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,2,power_law_1.01,0.04657920002937317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,2,power_law_1.01,0.1354688048362732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,2,balanced,0.09742400050163269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,2,power_law_1.01,0.1527232050895691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,2,power_law_1.01,0.05264639854431152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,2,balanced,0.7365333239237467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,4,power_law_1.2,4.399897766113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,2,power_law_1.01,0.16691839694976807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,2,balanced,0.2776533365249634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,2,power_law_1.01,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,2,power_law_1.01,0.1994815945625305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,4,power_law_1.2,8.110829162597657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,2,power_law_1.01,0.07078400254249573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,2,power_law_1.01,0.24638719558715821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,2,power_law_1.01,0.3065023899078369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,2,power_law_1.01,0.07082880139350892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,2,balanced,0.10875200231870015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,2,power_law_1.01,0.3277055978775024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,2,power_law_1.01,0.07552639842033386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,2,balanced,0.4061439832051595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,2,power_law_1.01,0.4584640026092529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,2,balanced,0.1092800001303355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,2,power_law_1.01,0.0762943983078003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,2,power_law_1.01,0.5712063789367676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,2,power_law_1.01,0.08078719973564148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,2,power_law_1.01,0.8354751586914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,2,balanced,0.9634559949239095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,2,power_law_1.01,0.9970623970031738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,2,power_law_1.01,0.08536319732666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,2,power_law_1.01,1.2816767692565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,2,power_law_1.01,0.08794879913330078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,2,balanced,0.5301173528035482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,2,power_law_1.01,2.097203254699707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,2,power_law_1.01,0.09056000113487243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,2,balanced,0.1285760005315145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,2,power_law_1.01,0.09975680112838745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,2,power_law_1.01,4.504819107055664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,2,power_law_1.01,0.10253440141677857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,2,balanced,0.1516853372255961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,2,power_law_1.01,0.11221120357513428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,2,balanced,0.1609599987665812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,2,power_law_1.01,0.1332352042198181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,2,balanced,0.7880746523539225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,2,balanced,0.21711466709772745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,2,power_law_1.01,0.14294400215148925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,2,balanced,1.1979573567708333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,2,power_law_1.01,0.17534719705581664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,2,balanced,0.2645919919013977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,2,power_law_1.01,0.20942718982696534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,2,power_law_1.01,0.2773184061050415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,2,power_law_1.01,0.3348479986190796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,2,balanced,0.40086400508880615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,2,power_law_1.01,0.47217278480529784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,2,power_law_1.01,0.5869184017181397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,2,balanced,1.0425386428833008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,2,power_law_1.01,0.8398528099060059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,2,balanced,0.48398399353027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,2,power_law_1.01,1.0595775604248048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,2,power_law_1.01,1.464179229736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,2,balanced,0.6987360318501791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,2,power_law_1.01,0.03874559998512268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,2,power_law_1.01,2.266399955749512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,2,power_law_1.01,0.04314239919185638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,2,power_law_1.01,4.550233459472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,2,power_law_1.01,0.046163201332092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,2,balanced,1.8806026776631672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,2,power_law_1.01,0.053472000360488894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,2,balanced,0.9205386638641357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,2,power_law_1.01,0.060864001512527466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,2,balanced,1.2902452945709229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,2,power_law_1.2,0.030079999566078187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,2,power_law_1.01,0.07440000176429748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,2,power_law_1.2,0.03229439854621887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,2,power_law_1.01,0.07760000228881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,2,power_law_1.2,0.037171199917793274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,2,power_law_1.01,0.07785599827766418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,2,power_law_1.2,0.04930559992790222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,2,power_law_1.01,0.08339840173721313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,2,balanced,1.356485366821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,2,power_law_1.2,0.057030397653579715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,2,power_law_1.01,0.08718720078468323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,2,power_law_1.2,0.08961920142173767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,2,power_law_1.01,0.09191679954528809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,2,power_law_1.01,0.09604480266571044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,2,power_law_1.2,0.0946175992488861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,2,power_law_1.01,0.10149120092391968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,2,power_law_1.2,0.09731839895248413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,2,power_law_1.01,0.11119999885559081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,2,power_law_1.2,0.09975039958953857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,2,power_law_1.2,0.09749119877815246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,2,balanced,1.7844533920288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,2,power_law_1.01,0.1194815993309021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,2,power_law_1.2,0.10483839511871337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,2,balanced,2.0521225929260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,2,power_law_1.01,0.1260543942451477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,2,power_law_1.2,0.11117440462112427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,2,power_law_1.2,0.11450879573822022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,2,power_law_1.01,0.13640960454940795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,2,power_law_1.2,0.11630079746246338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,2,power_law_1.2,0.12773760557174682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,2,power_law_1.01,0.16671359539031982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,2,power_law_1.2,0.13435519933700563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,2,power_law_1.01,0.18959360122680663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,2,power_law_1.2,0.14142719507217408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,2,power_law_1.01,0.260697603225708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,2,power_law_1.2,0.16188160181045533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,2,power_law_1.01,0.3304768085479736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,2,balanced,2.208346684773763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,2,power_law_1.2,0.17675520181655885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,2,power_law_1.01,0.4352384090423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,2,power_law_1.2,0.20451838970184327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,2,balanced,3.6081279118855796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,2,power_law_1.01,0.5266816139221191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,2,power_law_1.2,0.2603775978088379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,2,power_law_1.01,0.8172160148620605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,2,power_law_1.2,0.3125056028366089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,2,power_law_1.01,1.00131196975708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,2,power_law_1.2,0.3567744016647339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,2,power_law_1.01,1.5337920188903809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,2,power_law_1.2,0.4442624092102051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,2,power_law_1.01,2.0078336715698244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,2,power_law_1.2,0.605625581741333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,2,power_law_1.01,2.5756607055664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,2,power_law_1.2,0.903775978088379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,2,power_law_1.01,4.091635131835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,2,power_law_1.2,1.1381952285766601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,2,power_law_1.01,7.985964965820313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,2,power_law_1.2,1.4329919815063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,2,balanced,3.4843467076619468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,2,power_law_1.2,2.2412288665771483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,2,power_law_1.2,4.5194751739501955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,2,balanced,3.9643894831339517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,2,power_law_1.2,0.03477759957313538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,2,power_law_1.2,0.0324288010597229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,2,power_law_1.2,0.03594880104064942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,2,power_law_1.2,0.0434112012386322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,2,power_law_1.2,0.05080320239067078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,2,power_law_1.2,0.0709824025630951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,2,power_law_1.2,0.07061759829521179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,2,power_law_1.2,0.07415040135383606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,2,balanced,6.886869430541992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,2,power_law_1.2,0.0754688024520874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,2,power_law_1.2,0.07774080038070678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,2,power_law_1.2,0.08215680122375488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,2,power_law_1.2,0.03874559998512268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,2,power_law_1.2,0.08593279719352723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,2,power_law_1.2,0.04232319891452789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,2,power_law_1.2,0.04472320079803467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,2,power_law_1.2,0.08906880021095276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,2,power_law_1.2,0.05009920001029968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,2,power_law_1.2,0.09004160165786743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,2,power_law_1.2,0.05728639960289002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,2,power_law_1.2,0.07473919987678528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,2,power_law_1.2,0.0998080015182495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,2,power_law_1.2,0.07916799783706666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,2,power_law_1.2,0.10700160264968872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,2,power_law_1.2,0.08116480112075805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,2,power_law_1.2,0.08522239923477173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,2,power_law_1.2,0.08759040236473084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,2,power_law_1.2,0.11455999612808228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,1,balanced,0.03049066662788391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,2,power_law_1.2,0.091430401802063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,2,power_law_1.2,0.1369920015335083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,2,power_law_1.2,0.10122879743576049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,1,balanced,0.03474666674931844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,2,power_law_1.2,0.1
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,2,power_law_1.2,0.14646400213241578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,1,balanced,0.04563733438650767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,2,power_law_1.2,0.11269760131835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,2,power_law_1.2,0.17623039484024047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,1,balanced,0.0672266681989034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,2,power_law_1.2,0.20591359138488768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,1,balanced,0.1095306674639384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,2,power_law_1.2,0.2796607971191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,1,balanced,0.11013333002726237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,2,power_law_1.2,0.12392319440841675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,1,balanced,0.10977600018183391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,2,power_law_1.2,0.34461441040039065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,2,power_law_1.2,0.13550080060958863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,1,balanced,0.11071466406186421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,2,power_law_1.2,0.48757758140563967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,1,balanced,0.11115733782450359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,1,balanced,0.1133013367652893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,2,power_law_1.2,0.6661888122558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,1,balanced,0.11337066690127055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,2,power_law_1.2,0.13944319486618043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,2,power_law_1.2,0.9157376289367676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,1,balanced,0.11685333649317424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,2,power_law_1.2,0.16858240365982055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,1,balanced,0.1185706655184428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,2,power_law_1.2,0.201363205909729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,2,power_law_1.2,1.1738816261291505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,1,balanced,0.12146666646003723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,2,power_law_1.2,0.26753280162811277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,2,power_law_1.2,1.4942144393920898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,1,balanced,0.13275733590126038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,2,power_law_1.2,0.336409592628479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,1,balanced,0.1376479963461558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,2,power_law_1.2,2.5483776092529298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,2,power_law_1.2,0.4602047920227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,1,balanced,0.1507200002670288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,2,power_law_1.2,0.6040128231048584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,2,power_law_1.2,5.118035125732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,2,power_law_1.2,0.8490559577941894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,1,balanced,0.17271999518076578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,2,power_law_1.2,1.0390080451965331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,1,balanced,0.1853760083516439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,2,power_law_1.2,1.5222911834716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,1,balanced,0.21379733085632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,2,power_law_1.2,2.0799232482910157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,2,power_law_1.2,2.6620223999023436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,1,balanced,0.23324799537658691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,2,power_law_1.2,4.169689559936524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,1,balanced,0.34884798526763916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,2,power_law_1.2,9.103257751464843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,1,balanced,0.38628800710042316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,1,balanced,0.5802773237228394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,1,balanced,0.03692266593376795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,1,balanced,0.03622400015592575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,1,balanced,0.04186666508515676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,1,balanced,0.06065600117047628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,1,balanced,0.7511413097381592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,1,balanced,0.08599467078844707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,1,balanced,0.08741866548856099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,1,balanced,0.08777067065238953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,1,balanced,0.08869866530100505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,1,balanced,0.09054399530092876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,1,balanced,1.147877295811971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,1,balanced,0.09117333094278972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,1,balanced,0.0934986670811971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,1,balanced,0.09722666939099629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,1,balanced,0.10034132997194926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,1,balanced,0.10611733794212341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,1,balanced,0.1129866639773051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,1,balanced,0.06080000102519989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,1,balanced,0.11838933825492859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,1,balanced,1.4754667282104492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,1,balanced,0.06471466521422069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,1,balanced,0.1364959975083669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,1,balanced,0.06637866795063019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,1,balanced,0.08011733492215474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,1,balanced,0.15898133317629495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,1,power_law_1.01,0.02844800055027008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,1,balanced,0.10262399911880493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,1,power_law_1.01,0.03444480001926422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,1,balanced,0.17473065853118896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,1,balanced,0.10599999626477559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,1,power_law_1.01,0.033471998572349546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,1,power_law_1.01,0.03459199965000152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,1,balanced,0.10779199997584026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,1,balanced,0.21416000525156656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,1,power_law_1.01,0.04076800048351288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,1,power_law_1.01,0.037920001149177554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,1,balanced,0.10949333508809407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,1,balanced,0.11217600107192993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,1,power_law_1.01,0.04904319941997528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,1,power_law_1.01,0.05453439950942993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,1,balanced,0.25044800837834674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,1,balanced,0.11520000298817952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,1,power_law_1.01,0.05716480016708374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,1,power_law_1.01,0.06362239718437195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,1,balanced,1.835210641225179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,1,balanced,0.11884267131487529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,1,power_law_1.01,0.07633280158042907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,1,power_law_1.01,0.09844480156898498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,1,balanced,0.371616005897522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,1,balanced,0.12469866871833801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,1,power_law_1.01,0.07954559922218322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,1,power_law_1.01,0.10058239698410035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,1,balanced,0.1304266651471456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,1,power_law_1.01,0.0812608003616333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,1,power_law_1.01,0.10497920513153076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,1,balanced,0.4498720169067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,1,balanced,0.13436800241470337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,1,power_law_1.01,0.0863103985786438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,1,power_law_1.01,0.10947200059890747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,1,power_law_1.01,0.09034879803657532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,1,power_law_1.01,0.10995839834213257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,1,power_law_1.01,0.09580159783363343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,1,power_law_1.01,0.11829119920730591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,1,power_law_1.01,0.10085120201110839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,1,balanced,0.6532053152720133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,1,balanced,0.155349334081014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,1,power_law_1.01,0.12165759801864624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,1,power_law_1.01,0.10712319612503052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,1,balanced,0.1585706671079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,1,power_law_1.01,0.12803839445114135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,1,power_law_1.01,0.11096960306167603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,1,power_law_1.01,0.11832319498062134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,1,power_law_1.01,0.12999680042266845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,1,balanced,0.8612426916758219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,1,power_law_1.01,0.12825599908828736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,1,power_law_1.01,0.1369279980659485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,1,power_law_1.01,0.14257279634475709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,1,power_law_1.01,0.15082240104675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,1,balanced,2.986421267191569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,1,power_law_1.01,0.17215360403060914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,1,power_law_1.01,0.15914880037307738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,1,balanced,0.1881386637687683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,1,power_law_1.01,0.19051519632339478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,1,power_law_1.01,0.19376640319824218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,1,balanced,0.23269865910212198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,1,power_law_1.01,0.23878400325775145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,1,power_law_1.01,0.20519039630889893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,1,power_law_1.01,0.28536319732666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,1,power_law_1.01,0.052313601970672606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,1,balanced,0.2635466655095418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,1,balanced,1.328501303990682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,1,power_law_1.01,0.2472127914428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,1,power_law_1.01,0.3840831995010376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,1,power_law_1.01,0.06198400259017944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,1,balanced,0.38202134768168133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,1,power_law_1.01,0.2791615962982178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,1,power_law_1.01,0.48112640380859373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,1,power_law_1.01,0.06543359756469727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,1,power_law_1.01,0.3716415882110596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,1,power_law_1.01,0.6876160144805908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,1,balanced,0.44994668165842694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,1,power_law_1.01,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,1,power_law_1.01,0.8889663696289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,1,power_law_1.01,0.44992637634277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,1,power_law_1.01,0.0800704002380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,1,power_law_1.01,1.3034560203552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,1,power_law_1.01,0.6203135967254638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,1,power_law_1.01,0.09694719910621644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,1,balanced,0.6797973314921061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,1,power_law_1.01,0.7893184185028076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,1,power_law_1.01,1.7126783370971679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,1,power_law_1.01,0.09926400184631348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,1,balanced,1.7818719546000164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,1,power_law_1.01,0.10213760137557984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,1,power_law_1.01,1.1314559936523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,1,power_law_1.01,2.1398527145385744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,1,balanced,0.8272480169932047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,1,power_law_1.01,0.11052160263061524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,1,power_law_1.01,1.44717435836792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,1,power_law_1.01,3.421343994140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,1,power_law_1.01,0.11292799711227416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,1,power_law_1.01,1.791801643371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,1,power_law_1.01,0.12166399955749511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,1,power_law_1.01,6.8977409362792965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,1,balanced,1.2074133555094402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,1,power_law_1.01,0.13086719512939454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,1,power_law_1.01,2.8996608734130858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,1,power_law_1.01,0.13899519443511962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,1,power_law_1.01,0.15379199981689454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,1,power_law_1.01,6.045708847045899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,1,balanced,1.5863787333170574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,1,balanced,2.2101707458496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,1,power_law_1.01,0.1674496054649353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,1,power_law_1.01,0.17947520017623902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,1,power_law_1.2,0.028595200181007384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,1,power_law_1.01,0.19003520011901856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,1,balanced,5.857290903727214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,1,balanced,2.346106688181559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,1,power_law_1.2,0.03387520015239716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,1,power_law_1.01,0.23763198852539064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,1,power_law_1.2,0.03834240138530731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,1,power_law_1.01,0.2920383930206299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,1,power_law_1.2,0.049184000492095946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,1,power_law_1.01,0.4048319816589355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,1,power_law_1.2,0.06257920265197754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,1,power_law_1.01,0.49488000869750975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,1,power_law_1.2,0.09660159945487976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,1,power_law_1.01,0.6796544075012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,1,power_law_1.2,0.0351936012506485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,1,power_law_1.01,0.863430404663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,1,power_law_1.2,0.10448000431060792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,1,balanced,3.104506810506185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,1,power_law_1.2,0.035769599676132205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,1,power_law_1.01,1.2420479774475097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,1,balanced,3.542069435119629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,1,power_law_1.2,0.038431999087333676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,1,power_law_1.2,0.10910719633102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,1,power_law_1.01,1.6232128143310547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,1,power_law_1.2,0.04732159972190857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,1,power_law_1.2,0.11068799495697021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,1,power_law_1.2,0.054688000679016115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,1,power_law_1.2,0.11282559633255004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,1,power_law_1.01,2.378803253173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,1,power_law_1.2,0.07672320008277893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,1,power_law_1.2,0.1195072054862976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,1,power_law_1.01,3.131097602844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,1,power_law_1.2,0.0825984001159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,1,power_law_1.2,0.12479360103607177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,1,power_law_1.01,3.8806079864501952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,1,power_law_1.2,0.08387200236320495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,1,power_law_1.2,0.12851840257644653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,1,power_law_1.2,0.08892800211906433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,1,power_law_1.01,6.127398300170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,1,balanced,3.8428319295247397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,1,power_law_1.2,0.12900480031967163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,1,power_law_1.2,0.09345920085906982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,1,power_law_1.2,0.13849600553512573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,1,power_law_1.2,0.09654399752616882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,1,power_law_1.01,12.159839630126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,1,power_law_1.2,0.14753279685974122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,1,power_law_1.2,0.10396159887313842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,1,power_law_1.2,0.1652351975440979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,1,power_law_1.2,0.11029119491577148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,1,power_law_1.2,0.1931071996688843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,1,power_law_1.2,0.1121664047241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,1,power_law_1.2,0.11931519508361817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,1,power_law_1.2,0.2124351978302002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,1,power_law_1.2,0.13003519773483277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,1,power_law_1.2,0.25156478881835936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,1,power_law_1.2,0.1453760027885437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,1,power_law_1.2,0.2823231935501099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,1,power_law_1.2,0.1739456057548523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,1,power_law_1.2,0.3751039981842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,1,power_law_1.2,0.19119999408721924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,1,power_law_1.2,0.45165438652038575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,1,power_law_1.2,0.24063360691070557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,1,power_law_1.2,0.2884799957275391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,1,power_law_1.2,0.6173952102661133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,1,balanced,6.121946970621745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,1,power_law_1.2,0.388102388381958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,1,power_law_1.2,0.787660789489746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,1,power_law_1.2,0.4877120018005371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,1,power_law_1.2,1.1420351982116699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,1,power_law_1.2,0.686137580871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,1,balanced,6.813957214355469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,1,power_law_1.2,1.4585856437683105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,1,power_law_1.2,0.8863103866577149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,1,power_law_1.2,1.8058624267578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,1,power_law_1.2,1.303705596923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,1,power_law_1.2,2.9209663391113283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,1,power_law_1.2,1.7366464614868165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,1,power_law_1.2,2.152095985412598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,1,power_law_1.2,6.155987167358399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,1,power_law_1.2,3.4431167602539063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,1,power_law_1.2,7.027110290527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,1,balanced,12.127787272135416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,1,power_law_1.2,0.052108800411224364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,1,power_law_1.2,0.06353920102119445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,1,power_law_1.2,0.06566399931907654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,1,power_law_1.2,0.07209600210189819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,1,power_law_1.2,0.07902719974517822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,1,power_law_1.2,0.09568639993667602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,4,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,1,power_law_1.2,0.09959040284156799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,4,balanced,0.05106666684150696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,1,power_law_1.2,0.10635520219802856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,4,balanced,0.049039999643961586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,4,balanced,0.06198399762312571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,1,power_law_1.2,0.11138559579849243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,4,balanced,0.09502399961153667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,1,power_law_1.2,0.11414400339126587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,4,balanced,0.06806399921576183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,1,power_law_1.2,0.12239999771118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,4,balanced,0.17091200749079385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,1,power_law_1.2,0.13226239681243895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,4,balanced,0.10443199674288432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,4,balanced,0.304149329662323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,1,power_law_1.2,0.14010239839553834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,1,power_law_1.2,0.15343999862670898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,4,balanced,0.17449599504470825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,4,balanced,0.3076853354771932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,4,balanced,0.17656532923380533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,4,balanced,0.3060266574223836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,1,power_law_1.2,0.1695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,4,balanced,0.3070026636123657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,4,balanced,0.17715734243392944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,1,power_law_1.2,0.18142720460891723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,4,balanced,0.17706133921941122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,4,balanced,0.30776532491048175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,4,balanced,0.30869332949320477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,4,balanced,0.17926400899887085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,4,balanced,0.17965867122014365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,4,balanced,0.31010133028030396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,1,power_law_1.2,0.190937602519989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,1,power_law_1.2,0.24046719074249268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,4,balanced,0.31221334139506024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,4,balanced,0.18220800161361694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,1,power_law_1.2,0.29224319458007814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,4,balanced,0.3137120008468628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,4,balanced,0.18408000469207764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,1,power_law_1.2,0.40500478744506835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,4,balanced,0.31699732939402264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,1,power_law_1.2,0.49625601768493655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,4,balanced,0.18672533830006918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,1,power_law_1.2,0.6834688186645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,4,balanced,0.3344159921010335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,4,balanced,0.18951465686162314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,1,power_law_1.2,0.8660672187805176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,4,balanced,0.3412799835205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,4,balanced,0.1986666719118754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,1,power_law_1.2,1.243718433380127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,4,balanced,0.1987733244895935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,1,power_law_1.2,1.6291328430175782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,4,balanced,0.34433066844940186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,1,power_law_1.2,2.3841856002807615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,4,balanced,0.20770132541656494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,4,balanced,0.35499731699625653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,1,power_law_1.2,3.1343488693237305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,4,balanced,0.2209333380063375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,4,balanced,0.3765600124994914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,1,power_law_1.2,3.8911808013916014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,4,balanced,0.24126933018366495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,4,balanced,0.398144006729126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,1,power_law_1.2,6.132076644897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,4,balanced,0.2630293369293213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,4,balanced,0.4163573185602824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,1,power_law_1.2,12.172064208984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,4,balanced,0.2877279917399089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,4,balanced,0.5286933183670044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,4,balanced,0.37987732887268066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,4,balanced,0.039279999832312264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,4,balanced,0.5798720121383667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,4,balanced,0.04720533390839895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,4,balanced,0.42601601282755536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,4,balanced,0.06513066589832306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,4,balanced,0.1027893324693044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,4,balanced,0.17309866348902384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,4,balanced,0.7813440163930258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,4,balanced,0.17442133029301962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,4,balanced,0.17787732680638632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,4,balanced,0.5912906726201376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,4,balanced,0.17867734034856161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,4,balanced,0.17883733908335367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,4,power_law_1.01,0.10079360008239746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,4,balanced,0.18118933836619058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,4,balanced,1.0134186744689941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,4,balanced,0.18338666359583536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,4,power_law_1.01,0.08085759878158569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,4,balanced,0.7598559856414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,4,balanced,0.18756266434987387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,4,power_law_1.01,0.0881663978099823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,4,balanced,0.19064533710479736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,4,power_law_1.01,0.14525439739227294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,4,balanced,0.19625065724054971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,4,power_law_1.01,0.173088002204895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,4,power_law_1.01,0.2723520040512085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,4,power_law_1.01,0.06798080205917359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,4,power_law_1.01,0.26051840782165525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,4,balanced,1.4799466133117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,4,power_law_1.01,0.2856640100479126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,4,power_law_1.01,0.0721343994140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,4,balanced,1.1150293350219727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,4,power_law_1.01,0.2905791997909546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,4,power_law_1.01,0.060652798414230345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,4,balanced,0.20635199546813965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,4,power_law_1.01,0.29385600090026853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,4,power_law_1.01,0.09392639994621277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,4,balanced,0.21092800299326578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,4,power_law_1.01,0.3012095928192139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,4,power_law_1.01,0.1167296051979065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,4,power_law_1.01,0.3131711959838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,4,power_law_1.01,0.15973759889602662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,4,power_law_1.01,0.06812800168991089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,4,power_law_1.01,0.32529919147491454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,4,power_law_1.01,0.1641152024269104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,4,power_law_1.01,0.05782399773597717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,4,power_law_1.01,0.3493760108947754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,4,balanced,1.949621359507243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,4,power_law_1.01,0.16636799573898314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,4,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,4,power_law_1.01,0.3602368116378784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,4,power_law_1.01,0.17339520454406737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,4,balanced,1.4507840474446614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,4,power_law_1.01,0.08654080033302307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,4,power_law_1.01,0.38049280643463135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,4,power_law_1.01,0.1738368034362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,4,power_law_1.01,0.11389440298080444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,4,power_law_1.01,0.36239359378814695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,4,power_law_1.01,0.18509440422058104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,4,power_law_1.01,0.1477504014968872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,4,power_law_1.01,0.1958143949508667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,4,power_law_1.01,0.43512959480285646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,4,balanced,0.22753065824508667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,4,power_law_1.01,0.16895359754562378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,4,power_law_1.01,0.2025599956512451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,4,power_law_1.01,0.16227840185165404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,4,power_law_1.01,0.4328000068664551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,4,balanced,0.2525920073191325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,4,power_law_1.01,0.19865599870681763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,4,power_law_1.01,0.16992640495300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,4,power_law_1.01,0.48114562034606934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,4,power_law_1.2,0.10106879472732544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,4,balanced,0.2690719962120056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,4,power_law_1.01,0.2075200080871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,4,power_law_1.01,0.18526079654693603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,4,power_law_1.01,0.5871808052062988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,4,power_law_1.2,0.06586880087852479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,4,balanced,2.4260427157084146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,4,power_law_1.01,0.21788160800933837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,4,power_law_1.01,0.19557759761810303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,4,power_law_1.01,0.7108479976654053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,4,power_law_1.2,0.08906880021095276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,4,balanced,0.34138135115305585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,4,balanced,1.815242608388265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,4,power_law_1.01,0.21953918933868408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,4,power_law_1.01,0.20650880336761473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,4,power_law_1.2,0.1395967960357666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,4,power_law_1.01,0.8363967895507812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,4,power_law_1.01,0.26039040088653564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,4,power_law_1.01,0.2178368091583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,4,balanced,0.3900959889094035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,4,power_law_1.2,0.17136640548706056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,4,power_law_1.01,1.0907520294189452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,4,power_law_1.01,0.28457601070404054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,4,power_law_1.01,0.23827199935913085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,4,power_law_1.2,0.2643647909164429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,4,power_law_1.01,1.4081855773925782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,4,power_law_1.01,0.3398655891418457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,4,balanced,0.5894773403803507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,4,power_law_1.2,0.28012800216674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,4,power_law_1.01,0.3856127977371216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,4,power_law_1.01,2.1963903427124025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,4,power_law_1.2,0.29259519577026366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,4,power_law_1.01,0.4820672035217285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,4,power_law_1.01,0.2558144092559814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,4,power_law_1.01,2.6346879959106446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,4,power_law_1.2,0.2996608018875122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,4,power_law_1.01,0.6057024002075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,4,balanced,0.6841866970062256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,4,power_law_1.01,0.26527359485626223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,4,power_law_1.2,0.3044735908508301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,4,power_law_1.01,3.230809783935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,4,power_law_1.01,0.8182271957397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,4,power_law_1.2,0.32074880599975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,4,power_law_1.01,0.9927807807922363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,4,power_law_1.01,4.826208114624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,4,power_law_1.01,0.26116480827331545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,4,power_law_1.2,0.3296832084655762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,4,power_law_1.01,1.4906496047973632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,4,balanced,0.9956426620483398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,4,power_law_1.01,0.3155904054641724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,4,power_law_1.2,0.351308798789978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,4,power_law_1.01,1.880415916442871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,4,power_law_1.01,10.111705780029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,4,power_law_1.01,0.3547327995300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,4,power_law_1.2,0.34736640453338624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,4,power_law_1.01,2.5361215591430666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,4,power_law_1.01,0.4819007873535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,4,power_law_1.2,0.3828671932220459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,4,balanced,3.777162551879883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,4,balanced,2.84660275777181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,4,power_law_1.01,3.4897216796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,4,balanced,1.3090186913808186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,4,power_law_1.01,0.5658880233764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,4,power_law_1.2,0.4144896030426025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,4,power_law_1.2,0.3944767951965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,4,power_law_1.01,0.772211217880249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,4,power_law_1.01,7.484941101074218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,4,power_law_1.2,0.4582784175872803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,4,power_law_1.01,0.9836607933044433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,4,power_law_1.2,0.4490367889404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,4,power_law_1.01,1.3815999984741212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,4,power_law_1.2,0.5286143779754638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,4,power_law_1.01,1.8175296783447266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,4,balanced,1.9431254069010417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,4,power_law_1.2,0.6197824001312255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,4,power_law_1.01,2.6671743392944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,4,power_law_1.2,0.8060735702514649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,4,power_law_1.01,3.700979232788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,4,power_law_1.2,0.9488063812255859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,4,power_law_1.01,4.4804542541503904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,4,power_law_1.2,1.2995840072631837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,4,power_law_1.01,6.8661247253417965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,4,power_law_1.2,1.574681568145752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,4,power_law_1.2,2.651020812988281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,4,balanced,2.5804266929626465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,4,power_law_1.01,13.334182739257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,4,power_law_1.2,3.208281707763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,4,power_law_1.2,4.444902420043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,4,power_law_1.2,7.0447746276855465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,4,power_law_1.2,15.19354248046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,4,balanced,3.2075894673665366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,4,balanced,5.635397593180339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,4,balanced,7.37282117207845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,4,power_law_1.2,0.06398720145225525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,4,power_law_1.2,0.045049598813056944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,4,power_law_1.2,0.06351360082626342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,4,power_law_1.2,0.08047360181808472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,4,power_law_1.2,0.0890496015548706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,4,power_law_1.2,0.163481605052948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,4,power_law_1.2,0.15964159965515137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,4,power_law_1.2,0.17582080364227295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,4,power_law_1.2,0.17196160554885864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,4,balanced,5.093157450358073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,4,power_law_1.2,0.17843199968338014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,4,power_law_1.2,0.17945599555969238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,4,power_law_1.2,0.1962048053741455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,4,power_law_1.2,0.2092479944229126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,4,power_law_1.2,0.2065279960632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,4,power_law_1.2,0.21972479820251464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,4,power_law_1.2,0.23055999279022216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,4,power_law_1.2,0.23281280994415282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,4,power_law_1.2,0.28134400844573976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,4,power_law_1.2,0.3064448118209839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,4,power_law_1.2,0.3476032018661499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,4,power_law_1.2,0.40849919319152833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,4,power_law_1.2,0.558400011062622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,4,power_law_1.2,0.6925631999969483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,4,power_law_1.2,0.8566271781921386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,4,power_law_1.2,1.2255423545837403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,4,power_law_1.2,1.6638143539428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,4,power_law_1.2,2.3546432495117187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,4,power_law_1.2,2.814201545715332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,4,power_law_1.2,5.083206558227539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,4,power_law_1.2,8.954374694824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,4,balanced,10.11463991800944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,2,balanced,0.049178664882977806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,2,balanced,0.06365333497524261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,2,balanced,0.09657067060470581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,4,power_law_1.2,0.06796799898147583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,2,balanced,0.1688693364461263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,2,balanced,0.038575999438762665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,2,balanced,0.30504000186920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,4,power_law_1.2,0.05108479857444763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,2,balanced,0.3116319974263509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,2,balanced,0.04970133304595947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,4,power_law_1.2,0.06743040084838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,2,balanced,0.31173332532246906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,2,balanced,0.0673226664463679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,4,power_law_1.2,0.08599039912223816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,2,balanced,0.3107840021451314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,2,balanced,0.10686399539311726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,4,power_law_1.2,0.09827200174331666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,2,balanced,0.3128959933916728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,2,balanced,0.1779306729634603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,4,power_law_1.2,0.15171200037002563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,2,balanced,0.31153066953023273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,2,balanced,0.1797813375790914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,2,balanced,0.31725867589314777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,4,power_law_1.2,0.16660480499267577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,2,balanced,0.1797813375790914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,2,balanced,0.31808000802993774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,4,power_law_1.2,0.17036800384521483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,2,balanced,0.18150933583577475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,2,balanced,0.3219839930534363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,4,power_law_1.2,0.1776128053665161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,2,balanced,0.18544000387191772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,2,balanced,0.3247893253962199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,2,balanced,0.18490666151046753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,4,power_law_1.2,0.18787839412689208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,2,balanced,0.18802666664123535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,2,balanced,0.34090665976206463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,4,power_law_1.2,0.19827200174331666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,2,balanced,0.19211200873057047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,4,power_law_1.2,0.20506880283355713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,2,balanced,0.34513068199157715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,4,power_law_1.2,0.21790080070495604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,2,balanced,0.195306658744812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,2,balanced,0.3594826857248942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,4,power_law_1.2,0.25061759948730467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,2,balanced,0.19831466674804688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,2,balanced,0.37995731830596924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,2,balanced,0.20643200476964316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,2,balanced,0.40241066614786786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,2,balanced,0.21158933639526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,4,power_law_1.2,0.24995200634002684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,4,power_law_1.2,0.2707456111907959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,2,balanced,0.2262880007425944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,2,balanced,0.4338933229446411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,2,power_law_1.01,0.048172798752784726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,2,power_law_1.01,0.06313599944114685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,2,balanced,0.24586133162180582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,2,power_law_1.01,0.05694079995155334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,2,power_law_1.01,0.048179200291633605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,2,balanced,0.46797335147857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,4,power_law_1.2,0.2645312070846558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,2,balanced,0.27115732431411743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,2,power_law_1.01,0.08999040126800537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,2,power_law_1.01,0.05797119736671448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,4,power_law_1.2,0.337939190864563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,2,power_law_1.01,0.12777600288391114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,2,power_law_1.01,0.08786560297012329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,2,balanced,0.5912319819132487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,2,balanced,0.30827200412750244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,4,power_law_1.2,0.3751039981842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,2,power_law_1.01,0.17249280214309692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,2,power_law_1.01,0.10170880556106568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,4,power_law_1.2,0.4855679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,2,balanced,0.04736533264319102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,2,power_law_1.01,0.2672255992889404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,2,balanced,0.34145601590474445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,2,power_law_1.01,0.1589951992034912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,2,balanced,0.6585386594136556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,4,power_law_1.2,0.614028787612915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,2,power_law_1.01,0.26299519538879396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,2,balanced,0.054474666714668274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,2,power_law_1.01,0.16017279624938965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,2,power_law_1.01,0.2883647918701172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,4,power_law_1.2,0.8192319869995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,2,balanced,0.0711413323879242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,2,balanced,0.47545599937438965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,2,power_law_1.01,0.16494719982147216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,2,power_law_1.01,0.29142398834228517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,2,balanced,0.11034666498502095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,4,power_law_1.2,1.0382783889770508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,2,power_law_1.01,0.17386879920959472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,2,power_law_1.01,0.30023679733276365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,2,balanced,0.9207413196563721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,2,balanced,0.18118399381637573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,4,power_law_1.2,1.608403205871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,2,balanced,0.5495680173238119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,2,power_law_1.01,0.17699840068817138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,2,power_law_1.01,0.30760319232940675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,2,balanced,0.18481600284576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,4,power_law_1.2,2.1893695831298827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,2,balanced,0.1874986688296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,2,power_law_1.01,0.32220160961151123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,2,power_law_1.01,0.18528640270233154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,4,power_law_1.2,3.407622528076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,2,balanced,0.18994667132695517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,2,power_law_1.01,0.3296063899993896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,2,power_law_1.01,0.1944640040397644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,2,balanced,0.19034133354822794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,2,power_law_1.01,0.3462591886520386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,2,balanced,1.2066506544748943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,2,balanced,0.7782666683197021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,4,power_law_1.2,4.434675216674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,2,power_law_1.01,0.19993599653244018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,2,balanced,0.1955839991569519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,2,power_law_1.01,0.35990400314331056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,2,power_law_1.01,0.20609920024871825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,4,power_law_1.2,5.783302307128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,2,balanced,0.19684799512227377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,2,power_law_1.01,0.3628223896026611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,2,power_law_1.01,0.21814401149749757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,2,power_law_1.01,0.3820607900619507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,2,balanced,0.20378132661183676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,4,power_law_1.2,9.50887680053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,2,power_law_1.01,0.22817280292510986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,2,power_law_1.01,0.42172799110412595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,2,balanced,0.20915732781092325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,2,balanced,1.0137386322021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,2,power_law_1.01,0.2415616035461426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,2,power_law_1.01,0.4311103820800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,2,balanced,0.21588265895843506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,2,power_law_1.01,0.26857600212097166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,2,balanced,1.7803893089294434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,2,power_law_1.01,0.5034495830535889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,4,power_law_1.2,18.238841247558593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,2,power_law_1.01,0.2949696063995361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,2,power_law_1.01,0.5721280097961425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,2,power_law_1.01,0.3615744113922119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,2,power_law_1.01,0.692409610748291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,2,power_law_1.01,0.4070784091949463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,2,balanced,0.23438400030136108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,2,power_law_1.01,0.8903743743896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,2,balanced,1.4972853660583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,2,power_law_1.01,0.5400383949279786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,2,power_law_1.01,1.1691455841064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,2,balanced,0.24097599585851034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,2,power_law_1.01,0.6460288047790528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,2,power_law_1.01,1.477894401550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,2,power_law_1.01,0.9053567886352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,2,power_law_1.01,2.1810047149658205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,2,balanced,2.335082689921061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,2,power_law_1.01,1.161843204498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,2,power_law_1.01,2.951136016845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,2,power_law_1.01,1.6427711486816405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,2,power_law_1.01,3.514188766479492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,2,balanced,0.271509329477946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,2,power_law_1.01,2.097395133972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,2,balanced,1.9708266258239746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,2,power_law_1.01,5.253459167480469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,2,balanced,0.31617067257563275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,2,power_law_1.01,2.6284671783447267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,2,balanced,0.35678398609161377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,2,power_law_1.01,4.338246536254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,2,power_law_1.01,10.67413787841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,2,power_law_1.2,0.06206079721450806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,2,balanced,0.47491200764973956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,2,power_law_1.2,0.05363839864730835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,2,power_law_1.01,8.975033569335938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,2,power_law_1.01,0.05727999806404114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,2,balanced,2.926266670227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,2,balanced,0.544047991434733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,2,power_law_1.2,0.07765120267868042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,2,power_law_1.01,0.06170240044593811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,2,power_law_1.2,0.111244797706604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,2,power_law_1.01,0.06373760104179382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,2,power_law_1.01,0.08341119885444641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,2,balanced,0.8432532946268717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,2,power_law_1.2,0.14897919893264772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,2,power_law_1.01,0.11173759698867798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,2,balanced,2.4478185971577964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,2,power_law_1.2,0.25766398906707766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,2,power_law_1.01,0.1608448028564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,2,power_law_1.01,0.16582399606704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,2,power_law_1.2,0.2813184022903442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,2,balanced,1.0032959779103596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,2,power_law_1.01,0.1815616011619568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,2,power_law_1.2,0.29184000492095946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,2,power_law_1.01,0.18456319570541382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,2,power_law_1.01,0.19218560457229614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,2,power_law_1.2,0.3019392013549805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,2,power_law_1.01,0.2031615972518921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,2,power_law_1.2,0.3002432107925415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,2,power_law_1.01,0.22676479816436768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,2,balanced,1.4668426513671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,2,power_law_1.01,0.23529601097106934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,2,power_law_1.2,0.31729280948638916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,2,power_law_1.01,0.257043194770813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,2,power_law_1.2,0.3246527910232544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,2,power_law_1.2,0.3401599884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,2,power_law_1.01,0.2661504030227661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,2,power_law_1.2,0.33958399295806885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,2,balanced,1.9332106908162434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,2,power_law_1.01,0.27985920906066897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,2,balanced,4.6272586186726885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,2,power_law_1.2,0.36285440921783446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,2,power_law_1.2,0.3830912113189697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,2,power_law_1.01,0.2988095998764038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,2,power_law_1.2,0.40352640151977537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,2,power_law_1.01,0.36353919506072996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,2,power_law_1.2,0.4517055988311768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,2,balanced,3.7670774459838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,2,power_law_1.01,0.44929919242858884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,2,power_law_1.2,0.45045762062072753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,2,power_law_1.01,0.5843520164489746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,2,balanced,2.8483734130859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,2,power_law_1.01,0.6744256019592285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,2,power_law_1.2,0.5153215885162353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,2,power_law_1.01,0.9515456199645996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,2,power_law_1.2,0.6211008071899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,2,power_law_1.01,1.2298687934875487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,2,power_law_1.2,0.7582975864410401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,2,power_law_1.01,1.7059263229370116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,2,power_law_1.2,0.9932991981506347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,2,power_law_1.01,2.1927040100097654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,2,power_law_1.2,1.2742912292480468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,2,power_law_1.01,3.225331115722656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,2,power_law_1.01,4.283103942871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,2,power_law_1.2,1.4857600212097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,2,power_law_1.01,5.108550262451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,2,power_law_1.2,2.134297561645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,2,balanced,3.7744054794311523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,2,power_law_1.2,3.1354816436767576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,2,power_law_1.01,8.961529541015626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,2,power_law_1.2,3.5279232025146485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,2,power_law_1.01,16.569734191894533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,2,power_law_1.2,5.907289505004883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,2,power_law_1.2,11.898751831054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,2,balanced,4.68828805287679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,2,balanced,8.976202646891275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,2,balanced,7.727045059204102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,2,balanced,7.473936080932617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,2,power_law_1.2,0.04764800071716309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,2,power_law_1.2,0.043628799915313723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,2,power_law_1.2,0.05690240263938904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,2,power_law_1.2,0.07507839798927307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,2,power_law_1.2,0.09445120096206665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,2,power_law_1.2,0.15745279788970948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,2,power_law_1.2,0.16510720252990724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,2,power_law_1.2,0.17230720520019532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,2,power_law_1.2,0.17649279832839965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,2,power_law_1.2,0.1783360004425049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,2,power_law_1.2,0.19233280420303345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,2,power_law_1.2,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,2,power_law_1.2,0.19846400022506713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,2,power_law_1.2,0.05464320182800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,2,power_law_1.2,0.20256640911102294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,2,balanced,14.915130615234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,2,power_law_1.2,0.0645632028579712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,2,power_law_1.2,0.20927999019622803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,2,power_law_1.2,0.08513919711112976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,1,balanced,0.049402669072151184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,2,power_law_1.2,0.2247551918029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,2,power_law_1.2,0.09972479939460754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,1,balanced,0.06418666740258534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,2,power_law_1.2,0.23765759468078612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,1,balanced,0.09912000099817912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,2,power_law_1.2,0.16183040142059327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,2,power_law_1.2,0.2404223918914795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,2,power_law_1.2,0.17280639410018922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,1,balanced,0.17488000790278116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,2,power_law_1.2,0.2736063957214355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,2,power_law_1.2,0.1863935947418213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,1,balanced,0.3078186710675557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,2,power_law_1.2,0.31794559955596924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,1,balanced,0.31455467144648236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,2,power_law_1.2,0.18881280422210694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,2,power_law_1.2,0.3873471975326538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,1,balanced,0.3150773247083028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,2,power_law_1.2,0.20239360332489015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,2,power_law_1.2,0.4286719799041748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,1,balanced,0.3162026604016622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,2,power_law_1.2,0.21267199516296387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,2,power_law_1.2,0.5708288192749024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,1,balanced,0.3171573281288147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,2,power_law_1.2,0.2221695899963379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,2,power_law_1.2,0.6674240112304688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,1,balanced,0.31866133213043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,2,power_law_1.2,0.23864319324493408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,1,balanced,0.3240213394165039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,2,power_law_1.2,0.9947967529296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,2,power_law_1.2,0.2593919992446899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,1,balanced,0.3288639982541402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,2,power_law_1.2,1.2791808128356934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,1,balanced,0.33238933483759564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,2,power_law_1.2,1.7585344314575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,2,power_law_1.2,0.273305606842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,1,balanced,0.34141866366068524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,2,power_law_1.2,0.2842303991317749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,1,balanced,0.3585866689682007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,2,power_law_1.2,2.183635139465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,1,balanced,0.366213321685791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,2,power_law_1.2,2.8360383987426756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,1,balanced,0.38419198989868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,2,power_law_1.2,0.31106560230255126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,2,power_law_1.2,4.91789436340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,1,balanced,0.42313067118326825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,2,power_law_1.2,0.3559168100357056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,1,balanced,0.44946666558583576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,2,power_law_1.2,0.45839362144470214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,2,power_law_1.2,10.116806030273438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,2,power_law_1.2,0.58853759765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,1,balanced,0.5067466497421265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,2,power_law_1.2,0.6809152126312256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,2,power_law_1.2,1.0059264183044434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,1,balanced,0.5922240018844604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,2,power_law_1.2,1.3167360305786133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,2,power_law_1.2,1.8381311416625976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,1,balanced,0.748965342839559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,2,power_law_1.2,2.270528030395508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,2,power_law_1.2,3.645004653930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,1,balanced,0.862885316212972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,1,balanced,0.039290666580200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,2,power_law_1.2,4.592723083496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,1,balanced,0.05143466591835022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,1,balanced,0.07216533521811168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,2,power_law_1.2,6.065958404541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,1,balanced,1.2292693456013997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,1,balanced,0.11541866262753804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,1,balanced,0.19220799207687378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,2,power_law_1.2,9.057817840576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,1,balanced,0.1943999926249186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,1,balanced,0.19546133279800415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,1,balanced,0.19478400548299155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,2,power_law_1.2,19.28540802001953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,1,balanced,1.615946610768636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,1,power_law_1.01,0.04650239944458008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,1,balanced,0.07009066641330719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,1,balanced,0.20069867372512817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,1,balanced,0.20252267519632974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,1,power_law_1.01,0.05492479801177978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,1,balanced,0.07436266541481018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,1,balanced,0.20483199755350748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,1,balanced,0.09226666887601216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,1,power_law_1.01,0.07971839904785157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,1,balanced,0.2092533310254415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,1,balanced,0.13100799918174744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,1,power_law_1.01,0.12030080556869507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,1,balanced,0.21335999170939127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,1,balanced,0.20844266812006632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,1,power_law_1.01,0.17091200351715088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,1,balanced,2.415226618448893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,1,balanced,0.2225546638170878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,1,balanced,0.21407999595006308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,1,power_law_1.01,0.2653183937072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,1,power_law_1.01,0.037868800759315493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,1,balanced,0.22206399838129678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,1,balanced,0.23256532351175943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,1,power_law_1.01,0.28009600639343263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,1,power_law_1.01,0.04284160137176514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,1,balanced,0.22266133626302084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,1,balanced,0.24060799678166708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,1,power_law_1.01,0.28954238891601564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,1,power_law_1.01,0.06346240043640136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,1,balanced,0.23106133937835693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,1,balanced,0.26684800783793133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,1,power_law_1.01,0.2937279939651489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,1,power_law_1.01,0.08238080143928528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,1,balanced,0.23758933941523233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,1,power_law_1.01,0.10592639446258545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,1,power_law_1.01,0.30817279815673826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,1,balanced,0.3000640074412028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,1,balanced,0.24209066232045492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,1,balanced,3.228783925374349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,1,power_law_1.01,0.1650879979133606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,1,power_law_1.01,0.3191359996795654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,1,balanced,0.2540000081062317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,1,balanced,0.330186665058136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,1,power_law_1.01,0.17167359590530396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,1,power_law_1.01,0.3288831949234009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,1,balanced,0.25835732618967694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,1,power_law_1.01,0.1815168023109436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,1,power_law_1.01,0.3616640090942383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,1,balanced,0.3847413460413615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,1,balanced,0.27559467156728107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,1,power_law_1.01,0.18540159463882447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,1,power_law_1.01,0.34766080379486086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,1,balanced,0.43698132038116455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,1,power_law_1.01,0.19341440200805665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,1,power_law_1.01,0.37985920906066895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,1,power_law_1.01,0.20183680057525635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,1,power_law_1.01,0.4001279830932617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,1,balanced,0.6296159823735555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,1,balanced,0.2997866670290629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,1,power_law_1.01,0.21463680267333984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,1,power_law_1.01,0.41631360054016114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,1,power_law_1.01,0.22653439044952392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,1,balanced,0.31350932518641156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,1,balanced,4.014309247334798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,1,power_law_1.01,0.49109759330749514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,1,power_law_1.01,0.22816638946533202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,1,balanced,0.7703466415405273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,1,power_law_1.01,0.5087552070617676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,1,power_law_1.01,0.24747519493103026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,1,power_law_1.01,0.5902336120605469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,1,power_law_1.01,0.2615423917770386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,1,power_law_1.01,0.7042367935180665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,1,power_law_1.01,0.28365440368652345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,1,balanced,1.1151786645253499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,1,power_law_1.01,0.33164799213409424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,1,balanced,0.3863946596781413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,1,power_law_1.01,0.8625023841857911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,1,power_law_1.01,0.3635839939117432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,1,power_law_1.01,1.000716781616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,1,balanced,0.4799199899037679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,1,power_law_1.01,0.439961576461792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,1,power_law_1.01,1.3504128456115723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,1,balanced,0.5251359939575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,1,power_law_1.01,0.5161280155181884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,1,balanced,1.4692427317301433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,1,power_law_1.01,1.700307273864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,1,power_law_1.01,0.6700607776641846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,1,balanced,0.7295306523640951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,1,power_law_1.01,0.8168512344360351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,1,power_law_1.01,2.470822334289551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,1,power_law_1.01,1.1413632392883302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,1,balanced,0.8549919923146566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,1,power_law_1.01,3.22305908203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,1,power_law_1.01,1.4737983703613282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,1,balanced,6.0472157796223955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,1,power_law_1.01,3.9760833740234376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,1,balanced,2.194704055786133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,1,power_law_1.01,2.1437183380126954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,1,balanced,1.3266719977060955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,1,power_law_1.01,2.8212928771972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,1,power_law_1.01,6.209881591796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,1,balanced,1.6061973571777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,1,power_law_1.01,3.4835136413574217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,1,power_law_1.01,13.090457153320312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,1,power_law_1.01,5.626630401611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,1,balanced,2.3655412991841636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,1,power_law_1.01,11.709241485595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,1,balanced,2.929178555806478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,1,power_law_1.01,0.06071680188179016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,1,balanced,3.1222718556722007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,1,power_law_1.01,0.07083520293235779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,1,power_law_1.01,0.08331519961357117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,1,power_law_1.01,0.10215040445327758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,1,power_law_1.01,0.13266559839248657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,1,power_law_1.01,0.18572160005569457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,1,power_law_1.01,0.19747840166091918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,1,balanced,3.663498560587565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,1,power_law_1.01,0.20184319019317626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,1,balanced,4.644538561503093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,1,power_law_1.01,0.21580159664154053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,1,power_law_1.01,0.2248768091201782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,1,power_law_1.01,0.24339840412139893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,1,power_law_1.01,0.2648128032684326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,1,power_law_1.01,0.2769407987594604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,1,power_law_1.01,0.31024000644683836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,1,power_law_1.01,0.33171839714050294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,1,power_law_1.01,0.36036479473114014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,1,balanced,6.157573064168294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,1,balanced,12.190053304036459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,1,power_law_1.01,0.39327359199523926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,1,power_law_1.01,0.5034687995910645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.01,0.594374418258667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,1,power_law_1.2,0.0471807986497879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.01,0.7761087894439698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.01,0.9561344146728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,1,balanced,5.566272099812825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,1,power_law_1.2,0.052902400493621826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.01,1.3339712142944335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.01,1.7093824386596679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,1,power_law_1.2,0.0744704008102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.01,2.4571136474609374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,1,power_law_1.2,0.11025919914245605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.01,3.2036033630371095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,1,balanced,7.6444746653238935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,1,power_law_1.2,0.15918079614639283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.01,4.685798263549804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,1,power_law_1.2,0.26881918907165525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.01,6.179385757446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,1,power_law_1.2,0.28409600257873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,1,power_law_1.01,7.671814727783203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,1,power_law_1.2,0.2955904006958008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,1,power_law_1.2,0.3012671947479248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,1,power_law_1.01,12.156684875488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,1,power_law_1.2,0.309555196762085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,1,power_law_1.2,0.33162879943847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,1,power_law_1.2,0.3411839962005615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,1,power_law_1.01,24.113095092773438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,1,power_law_1.2,0.3641535997390747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,1,power_law_1.2,0.3634624004364014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,1,power_law_1.2,0.03761920034885406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,1,power_law_1.2,0.39083518981933596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,1,power_law_1.2,0.042752000689506534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,1,power_law_1.2,0.4062079906463623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,1,power_law_1.2,0.05953279733657837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,1,power_law_1.2,0.42310400009155275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,1,power_law_1.2,0.07930240035057068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,1,power_law_1.2,0.48699522018432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,1,power_law_1.2,0.10206079483032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,1,balanced,12.159557342529297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,1,power_law_1.2,0.5120960235595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,1,power_law_1.2,0.16159360408782958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,1,power_law_1.2,0.5954048156738281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,1,power_law_1.2,0.17626240253448486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,1,power_law_1.2,0.7097343921661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,1,power_law_1.2,0.18634239435195923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,1,power_law_1.2,0.18773759603500367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,1,power_law_1.2,0.8992192268371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,1,power_law_1.2,0.19660799503326415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,1,power_law_1.2,1.010476779937744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,1,power_law_1.2,0.20803840160369874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,1,balanced,11.097872416178385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,1,power_law_1.2,1.3842368125915527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,1,power_law_1.2,0.2221440076828003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,1,power_law_1.2,0.23009281158447265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,1,power_law_1.2,1.7356159210205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,1,power_law_1.2,0.23598079681396483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,1,power_law_1.2,2.512883186340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,1,power_law_1.2,0.2454848051071167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,1,power_law_1.2,3.250137710571289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,1,power_law_1.2,0.2619647979736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,1,power_law_1.2,3.9689918518066407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,1,power_law_1.2,0.2864959955215454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,1,power_law_1.2,0.33304319381713865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,1,power_law_1.2,6.224345779418945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,1,power_law_1.2,0.36567680835723876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,1,power_law_1.2,0.4418623924255371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,1,power_law_1.2,13.156979370117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,1,power_law_1.2,0.5238912105560303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,1,power_law_1.2,0.6780223846435547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,1,power_law_1.2,0.8303487777709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,1,power_law_1.2,1.1537728309631348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,1,power_law_1.2,1.4910592079162597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,1,power_law_1.2,2.1598016738891603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,1,power_law_1.2,2.8392383575439455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,1,balanced,24.246564229329426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,1,power_law_1.2,3.5186431884765623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,1,power_law_1.2,5.837510299682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,1,power_law_1.2,11.816371154785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,1,power_law_1.2,0.06211199760437012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,1,power_law_1.2,0.07146239876747132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,1,power_law_1.2,0.07899519801139832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,1,power_law_1.2,0.10000640153884888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,4,balanced,0.0943999985853831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,1,power_law_1.2,0.12414079904556274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,4,balanced,0.12468799948692322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,4,balanced,0.21940267086029053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,1,power_law_1.2,0.18532480001449586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,4,balanced,0.3959999879201253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,1,power_law_1.2,0.1976256012916565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,4,balanced,0.7368106842041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,1,power_law_1.2,0.21332480907440185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,4,balanced,0.9235626856486002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,1,power_law_1.2,0.2197887897491455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,4,balanced,0.9278186957041422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,1,power_law_1.2,0.23330559730529785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,4,balanced,0.9256587028503418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,1,power_law_1.2,0.24674561023712158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,4,balanced,0.9307680130004883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,1,power_law_1.2,0.2671488046646118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,4,balanced,0.9304426511128744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,1,power_law_1.2,0.2827967882156372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,4,balanced,0.9203519821166992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,1,power_law_1.2,0.3138047933578491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,4,balanced,0.9326612949371338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,4,balanced,0.9325066407521566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,4,balanced,0.06846400101979573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,1,power_law_1.2,0.33077120780944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,4,balanced,0.9438186486562093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,4,balanced,0.09013332923253377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,1,power_law_1.2,0.3593983888626099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,4,balanced,0.9528373082478842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,4,balanced,0.13179733355840048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,4,balanced,0.9642240206400553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,4,balanced,0.22075732549031576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,4,balanced,0.3975359996159871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,4,balanced,0.9734613100687662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,1,power_law_1.2,0.4008959770202637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,4,balanced,0.4814506769180298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,4,balanced,1.0188586711883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,1,power_law_1.2,0.5081151962280274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,4,balanced,0.48709332942962646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.2,0.6045567989349365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,4,balanced,1.0274186929066975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,4,balanced,0.48704532782236737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.2,0.7861824035644531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,4,balanced,0.488261342048645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,4,balanced,1.3279679616292317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.2,0.9674688339233398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,4,balanced,0.49198933442433673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,4,balanced,0.49564798672993976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,4,balanced,1.1264053185780842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.2,1.3496319770812988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,4,balanced,0.4975466728210449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.2,1.714124870300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,4,balanced,0.5020106633504232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,4,balanced,1.973973274230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,4,balanced,0.5125013192494711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.2,2.468217658996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,4,balanced,0.5216906468073527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.2,3.2146305084228515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,4,balanced,0.5287359952926636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,4,balanced,1.4721706708272297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.2,4.692512130737304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,4,balanced,0.5388373136520386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.2,6.190828704833985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,4,balanced,0.5774293343226115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,4,balanced,2.689093271891276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,4,balanced,0.5800533294677734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,1,power_law_1.2,7.685081481933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,4,balanced,0.06807466844717662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,4,balanced,0.09119466940561931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,4,balanced,0.7780746618906657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,1,power_law_1.2,12.151315307617187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,4,balanced,0.13315199812253317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,4,balanced,0.22699199120203653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,4,balanced,0.6726933320363363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,4,balanced,0.3977706829706828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,4,balanced,2.7221225102742515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,4,balanced,0.49024001757303876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,1,power_law_1.2,24.129600524902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,4,balanced,0.49511468410491943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,4,balanced,1.1299946308135986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,4,balanced,0.4949920177459717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,4,balanced,0.4983146588007609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,4,balanced,0.49929598967234295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,4,balanced,0.5058559974034628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,4,balanced,0.9546879927317301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,4,balanced,0.5095733404159546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,4,power_law_1.01,0.23014400005340577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,4,balanced,3.413658777872721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,4,balanced,0.5155733426411947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,4,balanced,0.5247999827067057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,4,power_law_1.01,0.3855488061904907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,4,balanced,0.5385866562525431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,4,balanced,1.6422665913899739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,4,power_law_1.01,0.22370560169219972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,4,power_law_1.01,0.33615999221801757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,4,power_law_1.01,0.4254144191741943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,4,power_law_1.01,0.7343679904937744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,4,balanced,0.5497066577275594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,4,power_law_1.01,0.7635519981384278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,4,balanced,1.8164745966593425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,4,power_law_1.01,0.7797823905944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,4,balanced,4.654272079467773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,4,power_law_1.01,0.823027229309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,4,power_law_1.01,0.13176319599151612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,4,power_law_1.01,0.84268798828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,4,power_law_1.01,0.18765439987182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,4,power_law_1.01,0.8554495811462403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,4,balanced,0.5685973167419434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,4,power_law_1.01,0.9274239540100098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,4,power_law_1.01,0.1254464030265808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,4,power_law_1.01,0.9350399971008301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,4,power_law_1.01,0.19163520336151124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,4,balanced,2.3321812947591147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,4,power_law_1.01,0.9174400329589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,4,power_law_1.01,0.24690558910369872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,4,power_law_1.01,0.9912575721740723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,4,power_law_1.01,0.37079041004180907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,4,power_law_1.01,1.0297151565551759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,4,power_law_1.01,0.42405118942260744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,4,power_law_1.01,1.060966396331787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,4,power_law_1.01,0.42167038917541505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,4,balanced,5.3819840749104815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,4,power_law_1.01,1.2239808082580566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,4,balanced,0.620138684908549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,4,power_law_1.01,0.44405760765075686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,4,power_law_1.01,1.294700813293457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,4,power_law_1.01,0.4337024211883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,4,balanced,0.6601333220799764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,4,power_law_1.01,1.478502368927002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,4,power_law_1.01,0.4773439884185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,4,balanced,3.215573310852051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,4,balanced,0.7850613594055176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,4,power_law_1.01,1.6909824371337892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,4,power_law_1.01,0.48575358390808104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,4,balanced,0.8689280351003011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,4,power_law_1.01,2.062860870361328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,4,power_law_1.01,0.5143424034118652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,4,power_law_1.01,2.3717248916625975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,4,power_law_1.01,0.4902463912963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,4,balanced,1.3067519664764404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,4,power_law_1.01,0.5347392082214355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,4,power_law_1.01,3.2175487518310546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,4,power_law_1.01,0.5629119873046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,4,power_law_1.01,0.14298880100250244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,4,balanced,1.4708372751871746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,4,power_law_1.01,3.2998016357421873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,4,power_law_1.01,0.562559986114502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,4,power_law_1.01,0.16035840511322022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,4,power_law_1.01,5.122463989257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,4,power_law_1.01,0.6592832088470459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,4,power_law_1.01,0.133241605758667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,4,balanced,2.143498738606771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,4,balanced,3.554282824198405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,4,power_law_1.01,6.391916656494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,4,power_law_1.01,0.6988736152648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,4,power_law_1.2,0.23061759471893312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,4,power_law_1.01,0.18135679960250856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,4,power_law_1.01,0.8656000137329102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,4,power_law_1.2,0.18553600311279297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,4,power_law_1.01,0.24750080108642578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,4,power_law_1.01,7.286847686767578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,4,balanced,8.944778442382812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,4,power_law_1.01,0.9467264175415039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,4,power_law_1.2,0.168614399433136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,4,power_law_1.01,0.3944767951965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,4,balanced,2.8201119105021157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,4,power_law_1.01,11.308595275878906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,4,power_law_1.01,1.1753984451293946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,4,power_law_1.2,0.29117441177368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,4,power_law_1.01,0.4137728214263916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,4,power_law_1.2,0.39044480323791503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,4,power_law_1.01,0.4480639934539795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,4,power_law_1.01,1.4343104362487793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,4,power_law_1.2,0.7469888210296631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,4,power_law_1.01,0.44556798934936526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,4,power_law_1.01,1.8337472915649413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,4,power_law_1.01,22.865087890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,4,power_law_1.2,0.7621503829956054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,4,power_law_1.01,0.4468224048614502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,4,power_law_1.01,2.214387130737305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,4,power_law_1.2,0.8470784187316894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,4,power_law_1.01,0.5159103870391846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,4,balanced,3.8630987803141275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,4,power_law_1.01,3.0059200286865235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,4,power_law_1.01,0.5281343936920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,4,power_law_1.2,0.8654720306396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,4,power_law_1.01,4.061689758300782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,4,power_law_1.2,0.8642687797546387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,4,power_law_1.01,0.5697152137756347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,4,power_law_1.01,0.6267519950866699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,4,power_law_1.2,0.9086015701293946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,4,power_law_1.01,5.056351852416992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,4,power_law_1.01,0.6620800018310546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,4,power_law_1.2,0.8957504272460938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,4,balanced,5.630271911621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,4,power_law_1.01,6.989536285400391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,4,power_law_1.2,0.9838015556335449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,4,balanced,5.2381439208984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,4,power_law_1.2,1.0012672424316407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,4,power_law_1.01,0.6420479774475097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,4,power_law_1.01,14.723500061035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,4,power_law_1.2,0.9839743614196778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,4,power_law_1.2,1.0891648292541505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,4,power_law_1.01,0.6909632205963134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,4,power_law_1.2,1.135148811340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,4,power_law_1.2,1.3828224182128905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,4,power_law_1.01,0.7013951778411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,4,power_law_1.2,1.4281791687011718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,4,power_law_1.01,0.8340543746948242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,4,power_law_1.2,1.6864959716796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,4,balanced,6.251237233479817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,4,power_law_1.01,0.9807168006896972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,4,power_law_1.2,1.8601856231689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,4,power_law_1.01,1.124332809448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,4,power_law_1.2,2.2310400009155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,4,power_law_1.01,1.531187152862549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,4,power_law_1.2,2.521798324584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,4,power_law_1.01,1.9588735580444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,4,power_law_1.2,3.2205120086669923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,4,balanced,18.244586944580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,4,power_law_1.01,2.9302976608276365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,4,power_law_1.2,3.7448577880859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,4,power_law_1.01,3.742335891723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,4,power_law_1.2,5.135187149047852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,4,power_law_1.01,5.362636947631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,4,power_law_1.2,7.429804992675781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,4,power_law_1.01,6.634067535400391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,4,power_law_1.2,9.632978820800782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,4,power_law_1.01,8.125414276123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,4,balanced,10.204570770263672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,4,power_law_1.2,14.541612243652343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,4,power_law_1.01,12.943685913085938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,4,balanced,11.758394877115885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,4,power_law_1.01,28.896914672851562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,4,power_law_1.2,30.96624755859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,4,power_law_1.2,0.14199680089950562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,4,power_law_1.2,0.09904000163078308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,4,power_law_1.2,0.11839359998703003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,4,power_law_1.2,0.18700159788131715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,4,power_law_1.2,0.22695679664611818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,4,power_law_1.2,0.3712768077850342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,4,power_law_1.2,0.41863040924072265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,4,power_law_1.2,0.42086400985717776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,4,power_law_1.2,0.4523712158203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,4,power_law_1.2,0.469708776473999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,4,power_law_1.2,0.4740096092224121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,4,power_law_1.2,0.4938176155090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,4,power_law_1.2,0.5366975784301757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,4,power_law_1.2,0.5143871784210206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,4,power_law_1.2,0.5594624042510986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,4,balanced,20.71938196818034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,4,power_law_1.2,0.5796544075012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,4,power_law_1.2,0.5908607959747314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,4,power_law_1.2,0.7086400032043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,4,power_law_1.2,0.7435264110565185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,4,power_law_1.2,0.9580415725708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,4,power_law_1.2,1.0393856048583985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,4,power_law_1.2,1.396671962738037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,4,power_law_1.2,1.5740351676940918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,4,power_law_1.2,2.068364715576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,4,power_law_1.2,2.325331115722656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,4,power_law_1.2,3.5740543365478517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,4,power_law_1.2,4.350918579101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,4,power_law_1.2,5.750783920288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,4,power_law_1.2,9.886598205566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,4,power_law_1.2,18.309599304199217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,4,power_law_1.2,0.14102400541305543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,4,power_law_1.2,0.10289280414581299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,4,power_law_1.2,0.133241605758667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,4,power_law_1.2,0.17491840124130248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,4,power_law_1.2,0.239084792137146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,4,power_law_1.2,0.38724479675292967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,4,power_law_1.2,0.4383872032165527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,4,power_law_1.2,0.4264383792877197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,4,power_law_1.2,0.44800639152526855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,4,power_law_1.2,0.4846015930175781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,2,balanced,0.09131733576456706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,4,power_law_1.2,0.5234687805175782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,2,balanced,0.1241919994354248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,4,power_law_1.2,0.5304768085479736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,2,balanced,0.21640533208847046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,4,power_law_1.2,0.574892807006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,2,balanced,0.4005066553751628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,4,power_law_1.2,0.6453567981719971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,2,balanced,0.7349173227945963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,4,power_law_1.2,0.6503359794616699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,2,balanced,0.9313066800435384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,2,balanced,0.06717866659164429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,2,balanced,0.9397599697113037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,2,balanced,0.9386933644612631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,2,balanced,0.09033067027727763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,4,power_law_1.2,0.6521471977233887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,2,balanced,0.1309333344300588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,2,balanced,0.9419253667195638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,2,balanced,0.22137065728505453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,2,balanced,0.9426399866739908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,4,power_law_1.2,0.7247871875762939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,2,balanced,0.3935626745223999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,2,balanced,0.9342559973398844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,2,balanced,0.48902400334676105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,2,balanced,0.9510026772816976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,2,balanced,0.4919999837875366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,4,power_law_1.2,0.7428864002227783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,2,balanced,0.49429865678151447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,2,balanced,0.9444053173065186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,2,balanced,0.4993813435236613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,4,power_law_1.2,0.8899776458740234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,2,balanced,0.9621067047119141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,2,balanced,0.5014506578445435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,4,power_law_1.2,1.0274239540100099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,2,balanced,0.9685226281483968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,2,balanced,0.5066986481348673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,4,power_law_1.2,1.2089728355407714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,2,balanced,0.9792373180389404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,2,balanced,0.5108266671498617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,4,power_law_1.2,1.63372802734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,2,balanced,1.00272003809611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,2,balanced,0.5157546599706014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,4,power_law_1.2,2.0086719512939455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,2,balanced,1.032106637954712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,2,balanced,0.5216266711552938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,4,power_law_1.2,3.1679296493530273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,2,balanced,1.054960012435913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,2,balanced,0.5368853410085043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,4,power_law_1.2,4.096934509277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,2,balanced,0.5386346578598022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,2,balanced,1.458181381225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,4,power_law_1.2,5.923737716674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,2,balanced,0.5523093144098917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,2,balanced,1.1983839670817058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,2,power_law_1.01,0.14169600009918212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,2,power_law_1.01,0.09297919869422913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,4,power_law_1.2,7.104640197753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,2,balanced,0.647050658861796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,2,power_law_1.01,0.1644863963127136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,2,power_law_1.01,0.10815999507904053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,2,balanced,0.6232426563898722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,4,power_law_1.2,9.845062255859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,2,balanced,2.0350613594055176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,2,power_law_1.01,0.16713600158691405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,2,power_law_1.01,0.11484800577163697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,2,balanced,0.07798400024573009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,2,power_law_1.01,0.29189119338989256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,2,balanced,0.9445119698842367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,2,power_law_1.01,0.17239680290222167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,4,power_law_1.2,14.907711791992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,2,power_law_1.01,0.3814591884613037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,2,balanced,0.09698667128880818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,2,power_law_1.01,0.2172032117843628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,2,balanced,1.6081387201944988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,2,balanced,0.7464586893717448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,2,balanced,0.14313600460688272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,2,power_law_1.01,0.6848063945770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,2,power_law_1.01,0.3838399887084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,2,balanced,0.2340480089187622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,2,power_law_1.01,0.7233024120330811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,2,power_law_1.01,0.40848641395568847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,4,power_law_1.2,29.347213745117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,2,balanced,0.40459732214609784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,2,balanced,1.147871971130371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,2,power_law_1.01,0.8108223915100098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,2,balanced,2.851781209309896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,2,power_law_1.01,0.4276864051818848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,2,balanced,0.5014079809188843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,2,power_law_1.01,0.8046463966369629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,2,power_law_1.01,0.42548480033874514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,2,balanced,0.5032000144322714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,2,power_law_1.01,0.8269951820373536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,2,balanced,1.1030720074971516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,2,balanced,0.5069813330968221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,2,power_law_1.01,0.45090560913085936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,2,power_law_1.01,0.8706175804138183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,2,balanced,0.5139733155568441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,2,power_law_1.01,0.4674560070037842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,2,power_law_1.01,0.8925248146057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,2,balanced,2.9241441090901694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,2,balanced,0.5175360043843588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,2,power_law_1.01,0.47614078521728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,2,balanced,1.8523039817810059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,2,power_law_1.01,0.9091072082519531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,2,balanced,0.5244640111923218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,2,power_law_1.01,0.49596800804138186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,2,power_law_1.01,0.9068608283996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,2,balanced,0.5336746772130331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,2,power_law_1.01,0.49477758407592776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,2,power_law_1.01,0.9752896308898926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,2,balanced,0.5397813320159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,2,power_law_1.01,0.5308608055114746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,2,power_law_1.01,0.9910528182983398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,2,balanced,0.5556639830271403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,2,balanced,2.035242716471354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,2,power_law_1.01,0.5698751926422119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,2,balanced,4.30293337504069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,2,power_law_1.01,1.01594877243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,2,balanced,0.5698133309682211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,2,power_law_1.01,0.5695744037628174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,2,power_law_1.01,1.175327968597412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,2,power_law_1.01,0.6554175853729248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,2,power_law_1.01,1.356480026245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,2,power_law_1.01,0.10474879741668701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,2,power_law_1.01,0.720198392868042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,2,power_law_1.01,1.6786815643310546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,2,power_law_1.01,0.13303040266036986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,2,power_law_1.01,0.11854720115661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,2,power_law_1.01,0.8680512428283691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,2,power_law_1.01,1.6399360656738282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,2,balanced,0.5843466520309448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,2,power_law_1.01,0.1810431957244873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,2,balanced,2.9098987579345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,2,power_law_1.01,0.9205504417419433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,2,power_law_1.01,2.0087743759155274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,2,power_law_1.01,0.22634239196777345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,2,power_law_1.01,0.3953279972076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,2,power_law_1.01,1.1409215927124023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,2,power_law_1.01,2.369299125671387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,2,balanced,5.311866760253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,2,power_law_1.01,0.42207999229431153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,2,power_law_1.01,1.4890687942504883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,2,power_law_1.01,3.007232093811035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,2,power_law_1.01,0.4395904064178467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,2,balanced,0.6225546598434448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,2,power_law_1.01,1.9509824752807616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,2,power_law_1.01,3.6233409881591796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,2,power_law_1.01,0.4576255798339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,2,power_law_1.01,0.4773695945739746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,2,power_law_1.01,2.3521728515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,2,power_law_1.01,4.861888122558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,2,power_law_1.01,0.5216447830200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,2,power_law_1.01,0.5382847785949707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,2,power_law_1.01,3.16058235168457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,2,power_law_1.01,5.706521606445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,2,power_law_1.01,0.5734015941619873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,2,power_law_1.01,4.046566390991211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,2,balanced,3.6671520868937173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,2,power_law_1.01,0.6333055973052979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,2,power_law_1.01,6.949689483642578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,2,power_law_1.01,0.6822015762329101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,2,power_law_1.01,5.134835052490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,2,power_law_1.01,11.964985656738282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,2,balanced,6.057610829671224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,2,power_law_1.01,0.6541120052337647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,2,balanced,0.7303840319315592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,2,power_law_1.01,7.680140686035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,2,balanced,0.7958453496297201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,2,power_law_1.01,22.08258514404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,2,power_law_1.01,0.7229440212249756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,2,power_law_1.01,15.3782470703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,2,balanced,0.9506186644236246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,2,power_law_1.2,0.1445312023162842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,2,power_law_1.2,0.11280640363693237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,2,balanced,1.087978680928548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,2,power_law_1.01,0.8168448448181153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,2,power_law_1.2,0.1613312005996704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,2,power_law_1.01,0.9532032012939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,2,balanced,4.3130292892456055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,2,power_law_1.2,0.258950400352478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,2,power_law_1.01,1.1149824142456055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,2,balanced,1.650752067565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,2,power_law_1.01,1.3320511817932128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,2,power_law_1.2,0.3610368013381958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,2,power_law_1.01,1.7325632095336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,2,power_law_1.2,0.701804780960083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,2,power_law_1.01,2.1871999740600585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,2,balanced,1.920570691426595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,2,power_law_1.2,0.723583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,2,power_law_1.01,2.9955263137817383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,2,power_law_1.2,0.8150400161743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,2,power_law_1.01,3.992486572265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,2,power_law_1.2,0.8130623817443847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,2,power_law_1.01,5.8640705108642575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,2,balanced,2.8120107650756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,2,balanced,9.859301249186197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,2,power_law_1.2,0.8146112442016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,2,power_law_1.01,8.02691192626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,2,power_law_1.2,0.8919168472290039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,2,power_law_1.01,9.815699005126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,2,power_law_1.2,0.9141311645507812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,2,power_law_1.2,0.9242239952087402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,2,balanced,3.706629435221354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,2,power_law_1.01,14.07838134765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,2,power_law_1.2,0.9529727935791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,2,power_law_1.2,0.9932991981506347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,2,power_law_1.2,1.0220416069030762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,2,power_law_1.01,30.13324890136719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,2,balanced,6.843493143717448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,2,power_law_1.2,1.0727104187011718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,2,power_law_1.2,1.255558395385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,2,balanced,5.200218518575032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,2,power_law_1.2,1.457811164855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,2,power_law_1.2,1.7818559646606444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,2,power_law_1.2,1.6738176345825195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,2,power_law_1.2,2.0478399276733397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,2,power_law_1.2,2.526348876953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,2,power_law_1.2,3.2839935302734373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,2,balanced,6.908730824788411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,2,power_law_1.2,3.703443145751953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,2,power_law_1.2,5.126963043212891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,2,power_law_1.2,6.142374420166016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,2,power_law_1.2,7.166252899169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,2,power_law_1.2,12.192179107666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,2,balanced,18.678117116292317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,2,balanced,8.37393569946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,2,power_law_1.2,22.169407653808594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,2,balanced,13.357935587565104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,2,power_law_1.2,0.09367039799690247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,2,power_law_1.2,0.07479040026664734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,2,power_law_1.2,0.10266879796981812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,2,power_law_1.2,0.16380800008773805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,2,power_law_1.2,0.20103681087493896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,2,balanced,13.752415974934896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,2,power_law_1.2,0.3852672100067139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,2,power_law_1.2,0.40723838806152346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,2,power_law_1.2,0.42778239250183103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,2,power_law_1.2,0.4496255874633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,2,power_law_1.2,0.4583744049072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,2,power_law_1.2,0.48305277824401854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,2,power_law_1.2,0.4819200038909912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,2,power_law_1.2,0.5159232139587402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,2,power_law_1.2,0.5148223876953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,2,power_law_1.2,0.5494783878326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,2,power_law_1.2,0.578323221206665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,2,power_law_1.2,0.5991680145263671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,2,power_law_1.2,0.6834879875183105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,2,power_law_1.2,0.7557951927185058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,2,power_law_1.2,0.9034624099731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,2,power_law_1.2,0.9382783889770507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,2,power_law_1.2,1.1757247924804688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,2,power_law_1.2,1.578054428100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,2,power_law_1.2,1.9419391632080079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,2,power_law_1.2,2.351091194152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,2,power_law_1.2,3.3795520782470705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,2,balanced,27.9324951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,2,power_law_1.2,4.60513916015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,1,balanced,0.09019733468691508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,2,power_law_1.2,5.349305725097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,1,balanced,0.12502400080362955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,2,power_law_1.2,0.10797439813613892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,1,balanced,0.21668267250061035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,2,power_law_1.2,0.09129599928855896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,2,power_law_1.2,8.637862396240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,1,balanced,0.39686401685078937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,2,power_law_1.2,0.11337599754333497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,2,power_law_1.2,0.17640960216522217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,1,balanced,0.7438240051269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,2,power_law_1.2,0.2370687961578369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,1,balanced,0.9428319931030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,2,power_law_1.2,16.05055389404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,2,power_law_1.2,0.3799871921539307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,1,balanced,0.9424586296081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,2,power_law_1.2,0.4146880149841309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,2,power_law_1.2,0.44172158241271975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,1,balanced,0.9475839932759603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,2,power_law_1.2,0.4728576183319092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,2,power_law_1.2,0.49879679679870603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,1,balanced,0.9534347057342529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,2,power_law_1.2,0.5289472103118896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,1,balanced,0.9572266737620035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,2,power_law_1.2,0.5550015926361084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,2,power_law_1.2,0.5750400066375733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,1,balanced,0.9565440018971761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,2,power_law_1.2,0.6274496078491211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,1,balanced,0.9645866552988688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,2,power_law_1.2,0.6998591899871827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,1,balanced,0.9691359996795654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,1,balanced,0.9820000330607096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,2,power_law_1.2,0.6756991863250732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,1,balanced,1.0017706553141277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,1,balanced,1.010975996653239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,1,balanced,1.0337013403574626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,2,power_law_1.2,0.7603392124176025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,1,balanced,1.230240027109782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,1,balanced,0.06679999828338623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,1,balanced,1.1315146287282307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,2,power_law_1.2,0.837286376953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,1,balanced,0.09074667096138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,2,power_law_1.2,0.9723520278930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,1,balanced,0.13243732849756876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,1,balanced,1.2894879976908367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,2,power_law_1.2,1.1490303993225097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,1,balanced,0.22889065742492676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,1,balanced,0.4017546574274699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,2,power_law_1.2,1.3966591835021973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,1,balanced,1.334506670633952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,1,balanced,0.49395732084910077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,2,power_law_1.2,1.871001625061035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,1,balanced,0.5009066661198934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,2,power_law_1.2,2.375654411315918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,1,balanced,0.5021760066350301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,2,power_law_1.2,3.4107585906982423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,1,balanced,2.0162347157796225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,1,balanced,0.5143413146336874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,2,power_law_1.2,4.195564651489258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,1,balanced,0.5099306503931681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,2,power_law_1.2,6.651213073730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,1,balanced,0.5201226472854614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,1,balanced,1.9013172785441081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,1,balanced,0.5246560176213583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,2,power_law_1.2,8.287142181396485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,1,balanced,0.5344320138295492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,2,power_law_1.2,9.544831848144531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,1,balanced,0.5575146675109863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,1,balanced,3.7811946868896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,1,balanced,0.5668373505274454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,2,power_law_1.2,17.387315368652345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,1,balanced,0.5821119944254557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,1,balanced,0.6049600044886271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,2,power_law_1.2,33.73353576660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,1,balanced,3.5114399592081704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,1,balanced,0.7510560353597006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,1,balanced,0.7069599628448486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,1,power_law_1.01,0.0902783989906311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,1,balanced,0.10115200281143188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,1,balanced,0.9219146569569906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,1,power_law_1.01,0.11426559686660767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,1,balanced,0.11872532963752747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,1,power_law_1.01,0.06722559928894042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,1,power_law_1.01,0.16506240367889405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,1,balanced,0.8984906673431396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,1,balanced,0.16724266608556113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,1,balanced,4.6780961354573565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,1,power_law_1.01,0.2895359992980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,1,power_law_1.01,0.07905279994010925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,1,balanced,0.2641226649284363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,1,power_law_1.01,0.39792640209198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,1,balanced,1.3787466684977214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,1,power_law_1.01,0.10628479719161987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,1,balanced,0.4380906820297241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,1,power_law_1.01,0.6918272018432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,1,power_law_1.01,0.17480319738388062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,1,balanced,0.5389440059661865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,1,power_law_1.01,0.7626495838165284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,1,balanced,0.5463093519210815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,1,power_law_1.01,0.23158400058746337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,1,balanced,1.4221493403116863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,1,power_law_1.01,0.7910399913787842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,1,balanced,0.5557813247044882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,1,power_law_1.01,0.3751424074172974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,1,balanced,0.562122662862142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,1,power_law_1.01,0.7933504104614257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,1,power_law_1.01,0.4035776138305664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,1,balanced,6.304128011067708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,1,balanced,0.5672959884007772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,1,power_law_1.01,0.798195219039917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,1,power_law_1.01,0.4197120189666748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,1,balanced,2.322762648264567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,1,balanced,0.5797280073165894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,1,power_law_1.01,0.4377151966094971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,1,power_law_1.01,0.8460479736328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,1,balanced,0.5918026765187582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,1,power_law_1.01,0.4520256042480469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,1,power_law_1.01,0.8678208351135254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,1,balanced,0.6060800155003866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,1,power_law_1.01,0.4880959987640381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,1,power_law_1.01,0.8968064308166503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,1,balanced,0.6302666664123535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,1,power_law_1.01,0.5176832199096679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,1,power_law_1.01,0.9277055740356446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,1,balanced,2.656010627746582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,1,balanced,0.6633866628011068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,1,power_law_1.01,0.5289216041564941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,1,power_law_1.01,0.9429632186889648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,1,power_law_1.01,0.5361087799072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,1,power_law_1.01,1.0194432258605957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,1,power_law_1.01,0.5477375984191895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,1,power_law_1.01,1.0499967575073241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,1,balanced,7.691439946492513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,1,power_law_1.01,0.5675456047058105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,1,balanced,0.708026647567749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,1,power_law_1.01,1.1782272338867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,1,power_law_1.01,0.6287551879882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,1,power_law_1.01,1.3341119766235352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,1,balanced,3.6980905532836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,1,power_law_1.01,0.7193024158477783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,1,power_law_1.01,1.6198400497436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,1,power_law_1.01,0.775654411315918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,1,power_law_1.01,1.7250112533569335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,1,power_law_1.01,0.9263872146606446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,1,balanced,0.7694239616394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,1,power_law_1.01,2.2230079650878904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,1,power_law_1.01,1.0143872261047364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,1,power_law_1.01,1.3067392349243163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,1,power_law_1.01,2.939743995666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,1,power_law_1.01,1.7570432662963866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,1,power_law_1.01,3.7375038146972654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,1,power_law_1.01,2.276371192932129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,1,balanced,4.860768000284831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,1,power_law_1.01,3.580281448364258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,1,power_law_1.01,2.646668815612793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,1,balanced,0.9276373386383057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,1,power_law_1.01,5.063276672363282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,1,power_law_1.01,3.7400062561035154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,1,balanced,1.040549357732137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,1,power_law_1.01,6.602150726318359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,1,power_law_1.01,4.876275253295899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,1,balanced,11.99289067586263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,1,balanced,1.3276693026224773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,1,power_law_1.01,8.18787841796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,1,power_law_1.01,6.1539966583251955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,1,balanced,1.577082633972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,1,power_law_1.01,9.973939514160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,1,power_law_1.01,13.087405395507812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,1,balanced,5.834746678670247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,1,balanced,2.4114559491475425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,1,power_law_1.01,19.73157196044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,1,power_law_1.01,0.0988864004611969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,1,power_law_1.01,23.334072875976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,1,power_law_1.01,0.1245695948600769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,1,balanced,2.8998133341471353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,1,power_law_1.01,0.13878400325775148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,1,power_law_1.01,0.19699840545654296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,1,power_law_1.01,0.252729606628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,1,power_law_1.2,0.08992000222206116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,1,balanced,4.273008028666179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,1,power_law_1.01,0.4195712089538574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,1,power_law_1.2,0.09976959824562073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,1,power_law_1.01,0.4463168144226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,1,power_law_1.2,0.1612223982810974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,1,power_law_1.01,0.4678976058959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,1,power_law_1.2,0.25512959957122805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,1,power_law_1.01,0.4924160003662109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,1,power_law_1.2,0.35953919887542723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,1,balanced,5.6486771901448565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,1,power_law_1.01,0.5100863933563232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,1,power_law_1.2,0.6803199768066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,1,power_law_1.01,0.5637695789337158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,1,power_law_1.2,0.7604032039642334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,1,balanced,9.317157109578451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,1,power_law_1.01,0.5980671882629395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,1,power_law_1.2,0.7917439937591553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,1,power_law_1.01,0.6345471858978271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,1,power_law_1.2,0.8344896316528321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,1,power_law_1.01,0.7027008056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,1,power_law_1.2,0.8530176162719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,1,balanced,8.02181307474772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,1,power_law_1.2,0.8750399589538574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,1,power_law_1.01,0.785100793838501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,1,power_law_1.2,0.9009663581848144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,1,power_law_1.2,0.9255488395690918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,1,power_law_1.01,0.7843008041381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,1,power_law_1.2,0.9668800354003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,1,power_law_1.2,1.0094783782958985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,1,balanced,23.1627197265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,1,power_law_1.2,1.0380800247192383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,1,power_law_1.01,0.8654080390930176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,1,power_law_1.2,1.076352024078369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,1,balanced,10.74448013305664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,1,power_law_1.2,1.2241151809692383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,1,power_law_1.01,0.9847231864929199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,1,power_law_1.2,1.3761088371276855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,1,power_law_1.2,1.7036672592163087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.01,1.1572735786437989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,1,power_law_1.2,1.7724927902221679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.01,1.408473587036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.01,1.7204288482666015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,1,power_law_1.2,2.2515584945678713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,1,power_law_1.2,3.0226879119873047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.01,2.33319034576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.01,2.9502912521362306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,1,power_law_1.2,3.864064025878906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,1,balanced,13.056543986002604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,1,power_law_1.2,0.06680319905281067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,1,power_law_1.2,3.6994369506835936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.01,4.195616149902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,1,power_law_1.2,0.07007359862327575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,1,power_law_1.2,5.167814254760742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.01,5.430144119262695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,1,power_law_1.2,0.1068608045578003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,1,power_law_1.2,0.1538624048233032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,1,power_law_1.2,6.871756744384766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,1,power_law_1.2,0.20480639934539796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.01,7.925132751464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,1,power_law_1.2,0.37285120487213136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,1,power_law_1.2,0.41592960357666015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,1,power_law_1.2,8.452153778076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.01,10.40711669921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,1,balanced,18.65117899576823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,1,power_law_1.2,0.42817277908325196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,1,power_law_1.2,0.45792641639709475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,1,power_law_1.2,0.4651199817657471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,1,power_law_1.2,13.362419128417969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,1,power_law_1.01,12.926521301269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,1,power_law_1.2,0.5147391796112061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,1,power_law_1.2,0.5288576126098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,1,power_law_1.2,0.5636672019958496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,1,power_law_1.01,20.53368377685547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,1,power_law_1.2,0.5462592124938965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,1,power_law_1.2,23.290342712402342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,1,power_law_1.2,0.562828779220581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,1,power_law_1.2,0.5919551849365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,1,power_law_1.2,0.6443840026855469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,1,balanced,21.199535369873047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,1,power_law_1.2,0.7380799770355224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,1,power_law_1.01,40.957037353515624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,1,power_law_1.2,0.8014016151428223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,1,power_law_1.2,0.9478655815124511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,1,power_law_1.2,1.0558719635009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,1,power_law_1.2,1.33689603805542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,1,power_law_1.2,1.7848447799682616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,1,power_law_1.2,2.327609634399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,1,power_law_1.2,2.6804224014282227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,1,power_law_1.2,3.8200897216796874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,1,power_law_1.2,5.144204711914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,1,power_law_1.2,6.358015823364258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,1,power_law_1.2,10.014950561523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,1,power_law_1.2,19.70598449707031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,1,balanced,42.039326985677086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,4,balanced,0.08992532889048259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,4,balanced,0.12149866422017415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,1,power_law_1.2,0.09957759976387023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,4,balanced,0.2007840077082316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,1,power_law_1.2,0.10819840431213379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,4,balanced,0.3649226824442546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,4,balanced,0.6921546459197998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,1,power_law_1.2,0.13359999656677246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,4,balanced,1.3360586166381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,1,power_law_1.2,0.18491519689559938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,4,balanced,1.9787947336832683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,1,power_law_1.2,0.22633600234985352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,1,power_law_1.2,0.40729598999023436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,4,balanced,1.9756107330322266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,1,power_law_1.2,0.4501503944396973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,4,balanced,1.9780213038126628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,1,power_law_1.2,0.4794367790222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,4,balanced,1.9802613258361816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,4,balanced,1.9761813481648762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,1,power_law_1.2,0.5045887947082519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,4,balanced,1.9882346789042156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,1,power_law_1.2,0.527020788192749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,1,power_law_1.2,0.5731071949005127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,4,balanced,2.006074587504069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,1,power_law_1.2,0.622156810760498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,4,balanced,2.001866658528646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,1,power_law_1.2,0.6539328098297119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,4,balanced,2.016032059987386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,1,power_law_1.2,0.7250432014465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,4,balanced,2.032250722249349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,1,power_law_1.2,0.7946879863739014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,4,balanced,2.0353493690490723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,4,balanced,0.06657599906126659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,4,balanced,2.059226671854655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,1,power_law_1.2,0.7902016162872314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,4,balanced,0.08309866487979889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,4,balanced,2.1039466857910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,4,balanced,0.12627200285593668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,4,balanced,0.21089067061742148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,1,power_law_1.2,0.8844608306884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,4,balanced,2.167797406514486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,4,balanced,0.37146135171254474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,4,balanced,0.6941866874694824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,4,balanced,2.228853384653727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,4,balanced,1.018506685892741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,1,power_law_1.2,1.0066495895385743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,4,balanced,1.0202186902364094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.2,1.1618240356445313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,4,balanced,1.0228853225708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,4,balanced,2.3118185997009277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.2,1.4207807540893556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,4,balanced,1.0275946458180745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,4,balanced,1.0320266882578533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.2,1.732748794555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,4,balanced,1.0307199954986572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,4,balanced,2.4583093325297036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.2,2.3619968414306642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,4,balanced,1.0360906918843586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.2,2.9770751953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,4,balanced,1.046026627222697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.2,4.203609466552734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,4,balanced,1.0562079747517903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,4,balanced,2.6255146662394204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,4,balanced,1.0670666694641113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.2,5.445305633544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,4,balanced,1.083136002222697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.2,7.9324798583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,4,balanced,1.1131680011749268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,4,balanced,3.2248748143514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.2,10.433907318115235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,4,balanced,1.1434933344523113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,4,balanced,1.1918346881866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,1,power_law_1.2,12.906405639648437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,4,power_law_1.01,0.13333120346069335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,4,balanced,0.07982400059700012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,4,balanced,1.2341279983520508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,4,power_law_1.01,0.20253438949584962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,1,power_law_1.2,20.418476867675782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,4,balanced,0.09662933150927226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,4,power_law_1.01,0.2030656099319458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,4,power_law_1.01,0.3603584051132202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,4,balanced,3.482954661051432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,4,balanced,1.3287253379821777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,4,balanced,0.1418506701787313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,4,power_law_1.01,0.3712768077850342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,4,balanced,0.2351093292236328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,4,power_law_1.01,0.6792319774627685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,4,power_law_1.01,0.181222403049469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,4,balanced,0.3810559908548991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,4,power_law_1.01,0.2932415962219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,4,balanced,1.4476159413655598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,1,power_law_1.2,40.614810180664065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,4,power_law_1.01,0.3248447895050049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,4,balanced,0.7059573332468668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,4,power_law_1.01,0.597376012802124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,4,balanced,1.0295999844868977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,4,power_law_1.01,0.431334400177002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,4,power_law_1.01,0.8415424346923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,4,balanced,1.032431999842326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,4,power_law_1.01,0.5092288017272949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,4,balanced,1.611146608988444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,4,balanced,1.0320800145467122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,4,power_law_1.01,0.9488832473754882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,4,power_law_1.01,0.6773824214935302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,4,balanced,4.874719937642415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,4,balanced,1.0368320147196453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,4,power_law_1.01,1.2828096389770507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,4,power_law_1.01,0.683513593673706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,4,balanced,1.0418132940928142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,4,power_law_1.01,1.3357248306274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,4,power_law_1.01,0.7213568210601806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,4,balanced,1.0469653606414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,4,balanced,2.0774292945861816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,4,power_law_1.01,1.3027135848999023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,4,power_law_1.01,0.7403264045715332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,4,balanced,1.0510506629943848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,4,power_law_1.01,1.4049087524414063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,4,balanced,1.060634692509969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,4,power_law_1.01,0.7851903915405274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,4,power_law_1.01,1.5202176094055175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,4,power_law_1.01,0.15896320343017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,4,balanced,1.0747893651326497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,4,power_law_1.01,0.7728384017944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,4,power_law_1.01,1.554911994934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,4,power_law_1.01,0.23215360641479493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,4,power_law_1.01,1.6642816543579102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,4,balanced,1.0869706471761067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,4,power_law_1.01,0.8219200134277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,4,balanced,2.400815963745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,4,balanced,6.23194694519043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,4,power_law_1.01,0.3945280075073242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,4,power_law_1.01,1.7410240173339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,4,balanced,1.1065706411997478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,4,power_law_1.01,0.8805695533752441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,4,power_law_1.01,0.1968191981315613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,4,power_law_1.01,1.873619270324707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,4,power_law_1.01,0.8977472305297851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,4,power_law_1.01,0.3274944067001343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,4,balanced,1.1546986897786458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,4,power_law_1.01,0.4585087776184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,4,power_law_1.01,0.9499327659606933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,4,power_law_1.01,1.7392383575439454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,4,power_law_1.01,0.5310463905334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,4,power_law_1.01,1.051308822631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,4,power_law_1.01,1.9483583450317383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,4,power_law_1.01,0.7027328014373779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,4,power_law_1.01,1.1570624351501464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,4,power_law_1.01,0.7193727970123291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,4,power_law_1.01,2.310540771484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,4,power_law_1.01,0.7447360038757325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,4,power_law_1.01,1.4255423545837402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,4,balanced,1.2089172999064128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,4,power_law_1.01,2.7829568862915037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,4,balanced,3.2960265477498374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,4,power_law_1.01,0.7950399875640869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,4,power_law_1.01,1.3308799743652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,4,power_law_1.01,0.8309247970581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,4,power_law_1.01,2.700467109680176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,4,power_law_1.01,1.6552768707275392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,4,power_law_1.01,0.8752256393432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,4,power_law_1.01,3.338713455200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,4,power_law_1.01,0.9432895660400391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,4,power_law_1.01,1.8960704803466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,4,power_law_1.2,0.22387199401855468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,4,power_law_1.01,1.0010368347167968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,4,power_law_1.01,2.8427263259887696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,4,power_law_1.01,2.4216447830200196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,4,power_law_1.01,1.0829440116882325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,4,power_law_1.2,0.36094720363616944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,4,power_law_1.01,1.1498111724853515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,4,power_law_1.01,3.4524417877197267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,4,power_law_1.01,2.813420867919922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,4,balanced,9.23086929321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,4,power_law_1.2,0.33314559459686277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,4,balanced,1.3244640032450359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,4,power_law_1.01,1.436793613433838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,4,power_law_1.01,3.6499454498291017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,4,power_law_1.01,4.584543991088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,4,power_law_1.2,0.31550719738006594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,4,balanced,1.4171199798583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,4,power_law_1.2,0.5099967956542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,4,balanced,4.248933474222819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,4,power_law_1.01,4.041177749633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,4,power_law_1.01,1.423731231689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,4,power_law_1.01,5.621670532226562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,4,power_law_1.2,0.7515135765075683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,4,power_law_1.01,5.216614532470703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,4,balanced,1.6061333020528157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,4,power_law_1.01,6.343699264526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,4,power_law_1.2,0.8623104095458984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,4,power_law_1.01,1.4179455757141113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,4,power_law_1.01,7.747789001464843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,4,power_law_1.2,1.179308795928955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,4,power_law_1.01,7.542572784423828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,4,power_law_1.01,1.651807975769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,4,balanced,1.9087200164794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,4,power_law_1.2,1.2660863876342774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,4,power_law_1.01,2.0788991928100584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,4,power_law_1.01,2.32926082611084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,4,power_law_1.01,12.224384307861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,4,power_law_1.2,1.3267711639404296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,4,power_law_1.01,15.638796997070312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,4,power_law_1.01,3.13753604888916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,4,power_law_1.2,1.4049023628234862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,4,balanced,2.2064852714538574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,4,power_law_1.01,3.8897151947021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,4,power_law_1.2,1.4496959686279296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,4,power_law_1.01,23.837184143066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,4,power_law_1.01,5.486387252807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,4,power_law_1.2,1.4703616142272948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,4,power_law_1.01,7.3003074645996096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,4,power_law_1.2,1.7172864913940429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,4,balanced,3.287285486857096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,4,power_law_1.01,8.561491394042969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,4,power_law_1.2,1.7483648300170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,4,balanced,6.219568252563477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,4,power_law_1.2,1.9759040832519532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,4,power_law_1.01,12.980557250976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,4,power_law_1.2,1.7401344299316406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,4,power_law_1.01,27.83743896484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,4,power_law_1.2,2.0329919815063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,4,balanced,4.01144536336263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,4,power_law_1.2,2.3971967697143555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,4,power_law_1.2,3.0908735275268553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,4,power_law_1.2,2.8772287368774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,4,balanced,17.228159586588543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,4,power_law_1.2,3.7
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,4,power_law_1.2,3.0951679229736326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,4,power_law_1.2,3.6291648864746096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,4,balanced,5.627541224161784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,4,power_law_1.2,5.093260955810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,4,power_law_1.2,6.267712020874024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,4,power_law_1.2,7.1933441162109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,4,power_law_1.2,8.442822265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,4,balanced,7.38052241007487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,4,power_law_1.2,13.270669555664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,4,power_law_1.2,30.314105224609374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,4,balanced,11.903024037679037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,4,power_law_1.2,0.1329408049583435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,4,power_law_1.2,0.20237441062927247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,4,power_law_1.2,0.20134398937225342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,4,balanced,11.460037231445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,4,power_law_1.2,0.17993600368499757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,4,power_law_1.2,0.27935359477996824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,4,power_law_1.2,0.42357759475708007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,4,power_law_1.2,0.4509568214416504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,4,power_law_1.2,0.6384191989898682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,4,power_law_1.2,0.6594431877136231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,4,power_law_1.2,0.6520832061767579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,4,power_law_1.2,0.7438271999359131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,4,power_law_1.2,0.7491648197174072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,4,power_law_1.2,0.7449920177459717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,4,power_law_1.2,0.8487808227539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,4,power_law_1.2,0.8832896232604981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,4,power_law_1.2,0.9108351707458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,4,power_law_1.2,0.9684864044189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,4,power_law_1.2,1.0886336326599122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,4,power_law_1.2,1.2025343894958496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,4,power_law_1.2,1.4948415756225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,4,power_law_1.2,1.446828842163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,4,power_law_1.2,1.835270309448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,4,power_law_1.2,2.073094367980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,4,power_law_1.2,2.6373952865600585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,4,balanced,22.832438151041668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,4,power_law_1.2,3.0110143661499023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,4,power_law_1.2,3.7917823791503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,4,power_law_1.2,4.615001678466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,4,power_law_1.2,5.6064704895019535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,4,power_law_1.2,8.155404663085937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,4,power_law_1.2,0.15934079885482788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,4,power_law_1.2,0.2318336009979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,4,power_law_1.2,15.322061157226562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,4,power_law_1.2,0.2459968090057373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,2,balanced,0.08849066495895386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,4,power_law_1.2,0.1878592014312744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,2,balanced,0.06586666901906331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,2,balanced,0.12337066729863484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,4,power_law_1.2,0.2936896085739136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,2,balanced,0.2020960052808126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,2,balanced,0.08513599634170532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,2,balanced,0.3676533301671346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,4,power_law_1.2,0.4066175937652588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,2,balanced,0.6910613377888998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,2,balanced,0.12552000085512796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,2,balanced,1.334448019663493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,4,power_law_1.2,0.44744319915771485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,2,balanced,0.21200533707936606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,2,balanced,1.9925440152486165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,4,power_law_1.2,0.647872018814087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,2,balanced,0.3736106554667155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,2,balanced,1.9964319864908855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,2,balanced,0.709658702214559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,2,balanced,1.9912746747334797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,4,power_law_1.2,0.7175936222076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,2,balanced,1.9881919225056965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,2,balanced,1.0576746463775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,4,power_law_1.2,0.7052480220794678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,2,balanced,1.9823840459187825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,2,balanced,1.04640531539917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,2,balanced,1.9989919662475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,4,power_law_1.2,0.7623807907104492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,2,balanced,1.0505013465881348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,2,balanced,2.0056373278299966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,2,balanced,2.0093493461608887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,2,balanced,1.0434506734212239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,4,power_law_1.2,0.8012672424316406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,2,balanced,2.024346669514974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,2,balanced,1.055397351582845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,4,power_law_1.2,0.8473855972290039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,2,balanced,2.0371626218159995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,2,balanced,1.0699040095011394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,4,power_law_1.2,0.9631104469299316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,2,balanced,2.0616745948791504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,2,balanced,1.0945013364156086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,2,balanced,2.093594710032145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,4,power_law_1.2,1.0243647575378418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,2,balanced,1.0834773381551106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,2,balanced,0.107013334830602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,2,balanced,2.16701873143514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,4,power_law_1.2,1.0499967575073241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,2,balanced,1.096239964167277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,2,balanced,0.11999467015266418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,2,balanced,2.263146718343099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,4,power_law_1.2,1.1910207748413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,2,balanced,1.123311996459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,2,balanced,0.16119999686876932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,2,balanced,0.23881600300470987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,2,balanced,2.2947093645731607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,2,balanced,1.1298879782358806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,4,power_law_1.2,1.4235967636108398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,2,balanced,0.39394664764404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,2,balanced,1.1571786403656006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,2,balanced,0.71998397509257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,2,balanced,2.422170639038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,2,balanced,1.0456586678822835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,2,balanced,1.1920106410980225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,4,power_law_1.2,1.4955519676208495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,2,balanced,1.0509813626607258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,2,balanced,2.620960076649984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,2,balanced,1.2660053571065266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,2,balanced,1.0547413031260173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,2,balanced,1.05949862798055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,4,power_law_1.2,1.480185604095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,2,balanced,1.3516000111897786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,2,balanced,1.0662186940511067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,2,balanced,2.87392520904541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,4,power_law_1.2,1.7273216247558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,2,balanced,1.0766613483428955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,2,balanced,1.482682704925537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,4,power_law_1.2,2.359462356567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,2,balanced,1.083733320236206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,4,power_law_1.2,2.456915283203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,2,power_law_1.01,0.13187839984893798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,2,balanced,1.1006027062733967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,2,balanced,1.6297225952148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,2,balanced,3.5634241104125977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,4,power_law_1.2,3.464031982421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,2,power_law_1.01,0.1990399956703186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,2,balanced,1.1232266426086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,2,power_law_1.01,0.08769919872283935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,4,power_law_1.2,4.116108703613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,2,power_law_1.01,0.3638848066329956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,2,balanced,1.1380266348520915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,2,power_law_1.01,0.12346880435943604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,2,power_law_1.01,0.29079039096832277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,2,balanced,1.9137600262959797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,2,balanced,1.1804373264312744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,4,power_law_1.2,6.154438400268555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,2,power_law_1.01,0.20480639934539796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,2,power_law_1.01,0.511737585067749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,2,balanced,1.2727146943410237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,4,power_law_1.2,7.463775634765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,2,power_law_1.01,0.15872639417648315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,2,balanced,4.060229301452637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,2,power_law_1.01,0.785587215423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,2,power_law_1.01,0.29952640533447267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,2,power_law_1.01,0.9744383811950683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,4,power_law_1.2,9.873241424560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,2,balanced,2.491322676340739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,2,power_law_1.01,0.44008960723876955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,2,power_law_1.01,1.2146112442016601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,2,power_law_1.01,0.4830143928527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,2,balanced,1.3806826273600261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,2,power_law_1.01,1.2827072143554688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,4,power_law_1.2,15.389152526855469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,2,power_law_1.01,0.6567423820495606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,2,power_law_1.01,1.4090496063232423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,2,power_law_1.01,0.7276351928710938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,2,power_law_1.01,1.4645055770874023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,2,balanced,5.484794616699219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,4,power_law_1.2,28.080166625976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,2,power_law_1.01,0.7338560104370118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,2,power_law_1.01,1.4839808464050293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,2,balanced,2.991898536682129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,2,power_law_1.01,1.555884838104248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,2,power_law_1.01,0.751251220703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,2,power_law_1.01,1.5647744178771972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,2,power_law_1.01,0.7916416168212891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,2,balanced,1.5631200472513835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,2,power_law_1.01,1.6629951477050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,2,power_law_1.01,0.8075455665588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,2,power_law_1.01,1.6432256698608398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,2,balanced,1.7159199714660645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,2,power_law_1.01,0.8627327919006348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,2,power_law_1.01,1.768992042541504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,2,power_law_1.01,0.9274304389953614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,2,balanced,4.045562744140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,2,balanced,1.9806453386942546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,2,power_law_1.01,1.8895423889160157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,2,power_law_1.01,0.9824383735656739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,2,balanced,7.069253285725911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,2,power_law_1.01,2.0187200546264648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,2,power_law_1.01,0.9353152275085449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,2,balanced,2.4649227460225425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,2,power_law_1.01,2.321766471862793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,2,power_law_1.01,1.0372159957885743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,2,power_law_1.01,2.5851200103759764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,2,power_law_1.01,1.1814911842346192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,2,power_law_1.01,3.315865707397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,2,power_law_1.01,1.431833553314209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,2,balanced,3.030437469482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,2,power_law_1.01,2.858131217956543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,2,power_law_1.01,1.3963839530944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,2,power_law_1.01,3.3634368896484377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,2,power_law_1.01,1.7530879974365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,2,balanced,5.334927876790364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,2,power_law_1.01,1.7300800323486327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,2,power_law_1.01,4.6984703063964846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,2,balanced,4.498714764912923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,2,power_law_1.01,2.176972770690918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,2,power_law_1.01,5.938457489013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,2,power_law_1.01,3.1161216735839843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,2,power_law_1.01,6.6138557434082035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,2,power_law_1.01,3.9104190826416017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,2,balanced,10.393360137939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,2,power_law_1.01,8.079334259033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,2,power_law_1.01,4.772268676757813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,2,balanced,5.701215744018555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,2,power_law_1.01,12.211910247802734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,2,power_law_1.01,5.643494415283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,2,power_law_1.01,8.295174407958985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,2,power_law_1.01,22.81481018066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,2,power_law_1.01,0.1307584047317505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,2,power_law_1.01,0.16899839639663697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,2,power_law_1.01,16.120095825195314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,2,balanced,7.5798187255859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,2,power_law_1.01,0.25137279033660886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,2,balanced,7.984133402506511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,2,power_law_1.01,0.2007040023803711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,2,power_law_1.2,0.12066559791564942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,2,power_law_1.01,0.3373823881149292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,2,power_law_1.2,0.20113279819488525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,2,power_law_1.01,0.45311360359191893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,2,power_law_1.2,0.22499840259552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,2,power_law_1.01,0.5300992012023926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,2,power_law_1.2,0.28039040565490725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,2,power_law_1.01,0.6738815784454346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,2,power_law_1.2,0.4886655807495117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,2,power_law_1.01,0.7230847835540771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,2,power_law_1.2,0.6763328075408935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,2,power_law_1.01,0.7431359767913819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,2,balanced,10.278303782145182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,2,power_law_1.2,0.8548352241516113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,2,power_law_1.01,0.8036735534667969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,2,power_law_1.2,1.1882431983947754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,2,power_law_1.01,0.8279040336608887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,2,power_law_1.2,1.2110015869140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,2,power_law_1.01,0.8529600143432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,2,power_law_1.2,1.332755184173584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,2,power_law_1.01,0.9309951782226562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,2,power_law_1.2,1.3951744079589843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,2,power_law_1.01,1.009984016418457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,2,power_law_1.2,1.4859456062316894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,2,power_law_1.01,1.090777587890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,2,power_law_1.2,1.525376033782959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,2,balanced,19.55361048380534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,2,power_law_1.01,1.2059840202331542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,2,power_law_1.2,1.550291156768799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,2,power_law_1.01,1.4816384315490723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,2,power_law_1.2,1.637343978881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,2,power_law_1.2,1.7023168563842774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,2,power_law_1.2,1.7725696563720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,2,power_law_1.01,1.5514944076538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,2,balanced,15.764575958251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,2,power_law_1.2,1.9070400238037108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,2,power_law_1.2,2.1161088943481445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,2,power_law_1.01,1.6093759536743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,2,balanced,14.586410522460938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,2,power_law_1.01,1.9038400650024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,2,power_law_1.2,2.442777633666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,2,power_law_1.01,2.420345687866211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,2,power_law_1.2,2.760825538635254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,2,power_law_1.01,2.786400032043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,2,power_law_1.2,3.5813438415527346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,2,power_law_1.2,3.1192319869995115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,2,power_law_1.01,3.6838783264160155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,2,power_law_1.2,3.7581951141357424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,2,power_law_1.01,4.6228992462158205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,2,power_law_1.2,5.036524963378906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,2,power_law_1.01,6.640486145019532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,2,power_law_1.2,6.424550628662109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,2,power_law_1.01,8.684146881103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,2,power_law_1.2,7.264627075195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,2,power_law_1.01,10.674105834960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,2,power_law_1.2,8.439730834960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,2,power_law_1.01,16.61900177001953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,2,power_law_1.2,12.638988494873047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,2,power_law_1.2,0.08792960047721862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,2,power_law_1.2,23.213786315917968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,2,power_law_1.01,33.35455322265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,2,power_law_1.2,0.12436480522155761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,2,power_law_1.2,0.12432639598846436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,2,power_law_1.2,0.1657855987548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,2,balanced,31.513099670410156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,2,power_law_1.2,0.27381119728088377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,2,power_law_1.2,0.37373440265655516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,2,power_law_1.2,0.4415103912353516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,2,power_law_1.2,0.6234047889709473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,2,power_law_1.2,0.6602431774139405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,2,power_law_1.2,0.6695680141448974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,2,power_law_1.2,0.7429440021514893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,2,power_law_1.2,0.7854144096374511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,2,power_law_1.2,0.7687551975250244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,2,power_law_1.2,0.864844799041748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,2,power_law_1.2,0.9283391952514648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,2,power_law_1.2,0.9836031913757324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,2,power_law_1.2,0.9717696189880372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,2,power_law_1.2,1.0587712287902833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,2,power_law_1.2,1.2630335807800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,2,power_law_1.2,1.4482943534851074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,2,power_law_1.2,1.490617561340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,2,power_law_1.2,1.7750656127929687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,2,power_law_1.2,1.8088768005371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,1,balanced,0.09185600280761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,2,power_law_1.2,2.2864448547363283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,1,balanced,0.1267253359158834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,1,balanced,0.20350933074951172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,2,power_law_1.2,0.12638720273971557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,2,power_law_1.2,3.2190208435058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,1,balanced,0.3726079861323039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,2,power_law_1.2,0.1690559983253479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,1,balanced,0.7037866910298666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,2,power_law_1.2,4.244454574584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,2,power_law_1.2,0.1746880054473877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,1,balanced,1.33842134475708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,2,power_law_1.2,0.1965824007987976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,2,power_law_1.2,4.763513565063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,2,power_law_1.2,0.2722368001937866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,1,balanced,2.0402933756510415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,2,power_law_1.2,0.3857599973678589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,1,balanced,2.010474681854248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,2,power_law_1.2,5.718828964233398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,2,power_law_1.2,0.472441577911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,1,balanced,2.012074629465739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,2,power_law_1.2,0.6481664180755615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,1,balanced,2.023039976755778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,2,power_law_1.2,0.6854144096374511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,2,power_law_1.2,9.257382202148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,1,balanced,2.013141314188639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,2,power_law_1.2,0.7285568237304687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,2,power_law_1.2,0.7417407989501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,1,balanced,2.024127960205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,2,power_law_1.2,0.8206720352172852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,2,power_law_1.2,18.311212158203126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,1,balanced,2.040640036265055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,2,power_law_1.2,0.8653183937072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,1,balanced,2.0510613123575845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,2,power_law_1.2,0.9437567710876464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,2,power_law_1.2,1.0231616020202636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,1,balanced,2.0646400451660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,2,power_law_1.2,1.0733951568603515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,1,balanced,2.0741066932678223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,2,power_law_1.2,1.2163711547851563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,1,balanced,0.07113066812356313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,2,power_law_1.2,1.5533632278442382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,1,balanced,2.09661865234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,1,balanced,0.09009066224098206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,1,balanced,0.13223466277122498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,1,balanced,2.1517814000447593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,2,power_law_1.2,1.5721407890319825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,1,balanced,0.22249066829681396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,1,balanced,2.2626880009969077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,1,balanced,0.3959306478500366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,1,balanced,0.7283946673075358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,1,balanced,2.353274663289388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,2,power_law_1.2,1.7030847549438477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,1,balanced,1.0501226584116619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,2,power_law_1.2,1.961529541015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,1,balanced,2.4736266136169434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,1,balanced,1.0625546773274739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,2,power_law_1.2,2.61648006439209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,1,balanced,1.0655786991119385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,2,power_law_1.2,2.967763137817383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,1,balanced,1.0759039719899495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,1,balanced,2.7088801066080728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,2,power_law_1.2,3.965427017211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,1,balanced,1.0814346472422283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,1,balanced,1.0874239603678386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,2,power_law_1.2,4.787276840209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,1,balanced,1.1077813307444255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,1,balanced,2.9789600372314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,2,power_law_1.2,6.831948852539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,1,balanced,1.133354663848877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,1,balanced,1.1387466589609783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,2,power_law_1.2,8.684416198730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,1,balanced,0.16847999890645346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,1,balanced,1.1542773246765137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,2,power_law_1.2,11.120780944824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,1,balanced,0.17964800198872885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,1,balanced,3.4644479751586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,1,balanced,1.195039987564087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,1,balanced,0.2157920002937317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,1,balanced,1.2687466939290364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,1,balanced,0.30932799975077313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,2,power_law_1.2,18.542694091796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,1,balanced,0.46320533752441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,1,balanced,1.3091200192769368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,1,balanced,0.8172480265299479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,1,balanced,1.1737279891967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,1,balanced,4.308437347412109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,1,balanced,1.416042645772298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,2,power_law_1.2,33.03719787597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,1,balanced,1.1698826948801677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,1,balanced,1.1808640162150066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,1,balanced,1.540181318918864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,1,balanced,1.1892000039418538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,1,balanced,1.2099093596140544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,1,balanced,1.2253066698710124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,1,balanced,1.7618560791015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,1,balanced,1.237056016921997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,1,balanced,5.118085225423177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,1,balanced,1.272655963897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,1,balanced,1.9740160306294758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,1,balanced,1.3133333524068196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,1,balanced,1.351029396057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,1,balanced,1.4222559928894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,1,balanced,2.411685307820638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,1,balanced,1.5716053644816081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,1,power_law_1.01,0.0883072018623352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,1,balanced,6.768416086832683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,1,power_law_1.01,0.06835200190544129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,1,power_law_1.01,0.12654080390930175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,1,balanced,3.1645921071370444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,1,power_law_1.01,0.2041856050491333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,1,power_law_1.01,0.08634880185127258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,1,balanced,1.7173333168029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,1,power_law_1.01,0.26629760265350344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,1,power_law_1.01,0.12858879566192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,1,power_law_1.01,0.1523967981338501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,1,power_law_1.01,0.5123456001281739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,1,power_law_1.01,0.16437760591506959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,1,power_law_1.01,0.1753216028213501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,1,power_law_1.01,0.7852159976959229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,1,power_law_1.01,0.29348480701446533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,1,power_law_1.01,0.22081279754638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,1,power_law_1.01,0.955622386932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,1,power_law_1.01,0.43203201293945315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,1,balanced,4.085418701171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,1,power_law_1.01,0.24685440063476563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,1,power_law_1.01,1.2699520111083984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,1,power_law_1.01,0.508896017074585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,1,balanced,2.1177919705708823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,1,power_law_1.01,0.3712703943252563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,1,balanced,9.019599914550781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,1,power_law_1.01,1.283743953704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,1,power_law_1.01,0.664134407043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,1,power_law_1.01,0.5067647933959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,1,balanced,2.4202879269917807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,1,power_law_1.01,1.3436415672302247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,1,power_law_1.01,0.7140416145324707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,1,power_law_1.01,0.5954751968383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,1,power_law_1.01,1.403711986541748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,1,power_law_1.01,0.7438208103179932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,1,power_law_1.01,0.7751743793487549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,1,balanced,2.8708693186442056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,1,power_law_1.01,1.477932834625244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,1,power_law_1.01,0.8008768081665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,1,power_law_1.01,0.8019840240478515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,1,balanced,5.257823944091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,1,power_law_1.01,0.8195775985717774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,1,power_law_1.01,1.5413248062133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,1,power_law_1.01,0.829593563079834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,1,power_law_1.01,1.5775360107421874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,1,power_law_1.01,0.8531328201293945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,1,power_law_1.01,0.8783616065979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,1,balanced,3.6511414845784507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,1,power_law_1.01,1.6713983535766601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,1,power_law_1.01,0.8970496177673339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,1,power_law_1.01,0.9311615943908691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,1,power_law_1.01,1.7296384811401366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,1,power_law_1.01,0.950931167602539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,1,power_law_1.01,0.9701055526733399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,1,power_law_1.01,1.7579456329345704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,1,power_law_1.01,1.0027968406677246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,1,balanced,4.621935844421387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,1,power_law_1.01,1.03951997756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,1,power_law_1.01,1.974790382385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,1,power_law_1.01,1.0286784172058105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,1,power_law_1.01,1.144812774658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,1,balanced,13.011700948079428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,1,power_law_1.01,2.1074880599975585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,1,power_law_1.01,1.1737471580505372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,1,power_law_1.01,1.221446418762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,1,balanced,6.74293835957845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,1,power_law_1.01,2.4391231536865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,1,power_law_1.01,1.3003840446472168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,1,power_law_1.01,1.3914560317993163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,1,balanced,6.6353759765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,1,power_law_1.01,2.6680576324462892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,1,power_law_1.01,1.5864895820617675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,1,power_law_1.01,1.7207168579101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,1,power_law_1.01,3.3149375915527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,1,power_law_1.01,1.6188800811767579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,1,power_law_1.01,2.9956287384033202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,1,power_law_1.01,1.9823616027832032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.01,1.7884159088134766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,1,power_law_1.01,3.680575942993164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,1,power_law_1.01,2.0541568756103517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,1,power_law_1.01,4.776147079467774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,1,power_law_1.01,2.6446847915649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,1,balanced,8.75277328491211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.01,2.0684864044189455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,1,power_law_1.01,6.239328002929687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,1,power_law_1.01,3.382547378540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.01,2.4723840713500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,1,power_law_1.01,4.5809471130371096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,1,power_law_1.01,7.739174652099609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.01,3.2560638427734374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,1,power_law_1.01,5.61739501953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,1,power_law_1.01,9.343660736083985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.01,3.789158248901367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,1,balanced,10.276122411092123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,1,power_law_1.01,6.8581695556640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.01,5.182899093627929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,1,power_law_1.01,13.906137084960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.01,6.614937591552734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,1,power_law_1.01,10.388909149169923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,1,balanced,12.066090901692709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,1,power_law_1.2,0.08872960209846496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.01,9.399436950683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,1,power_law_1.01,27.6776123046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,1,power_law_1.2,0.12643200159072876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,1,power_law_1.01,21.37494354248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,1,power_law_1.2,0.15639040470123292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.01,12.229792022705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,1,power_law_1.2,0.272492790222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,1,power_law_1.01,15.030143737792969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,1,power_law_1.2,0.4470719814300537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,1,power_law_1.2,0.7049471855163574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,1,balanced,25.37176005045573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,1,power_law_1.01,23.459059143066405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,1,power_law_1.2,0.815123176574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,1,power_law_1.2,1.1765952110290527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,1,balanced,15.246159871419271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,1,power_law_1.2,1.2595264434814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,1,power_law_1.2,1.328934383392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,1,power_law_1.01,46.221823120117186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,1,power_law_1.2,1.3574015617370605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,1,power_law_1.2,1.4530495643615722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,1,power_law_1.2,1.4799488067626954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,1,power_law_1.2,1.5863167762756347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,1,power_law_1.2,1.6606527328491212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,1,power_law_1.2,1.7322559356689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,1,balanced,19.388858795166016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,1,power_law_1.2,1.7882944107055665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,1,power_law_1.2,0.06661760210990905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,1,power_law_1.2,2.045369529724121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,1,balanced,23.86303965250651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,1,power_law_1.2,0.08633599877357483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,1,power_law_1.2,2.1799999237060548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,1,power_law_1.2,0.10539519786834717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,1,power_law_1.2,2.5321727752685548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,1,power_law_1.2,0.16767359972000123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,1,power_law_1.2,2.8743743896484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,1,power_law_1.2,0.2596224069595337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,1,power_law_1.2,3.566022491455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,1,power_law_1.2,0.3864448070526123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,1,power_law_1.2,3.1980607986450194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,1,power_law_1.2,0.45145602226257325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,1,power_law_1.2,3.9597824096679686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,1,power_law_1.2,0.6276735782623291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,1,power_law_1.2,5.039436721801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,1,power_law_1.2,0.6852416038513184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,1,power_law_1.2,6.467225646972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,1,power_law_1.2,0.7227776050567627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,1,power_law_1.2,7.999443054199219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,1,power_law_1.2,0.7525248050689697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,1,power_law_1.2,0.7975359916687011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,1,power_law_1.2,0.8238975524902343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,1,power_law_1.2,9.471155548095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,1,power_law_1.2,0.9055232048034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,1,power_law_1.2,14.269593811035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,1,power_law_1.2,0.9505599975585938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,1,power_law_1.2,1.0149439811706542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,1,power_law_1.2,1.0690239906311034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,1,power_law_1.2,27.836569213867186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,1,power_law_1.2,1.2176192283630372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,1,power_law_1.2,1.334169578552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,1,power_law_1.2,1.6159807205200196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,1,balanced,47.34991455078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,1,power_law_1.2,1.703603172302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,1,power_law_1.2,2.0676799774169923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,1,power_law_1.2,2.1359167098999023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,1,power_law_1.2,2.6888959884643553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,1,power_law_1.2,3.547078323364258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,1,power_law_1.2,4.756927871704102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,1,power_law_1.2,5.7136894226074215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,1,power_law_1.2,6.89315185546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,1,power_law_1.2,10.52265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,1,power_law_1.2,21.554412841796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,4,balanced,0.057999998331069946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,4,balanced,0.06844266752401988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,4,balanced,0.0795360008875529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,4,balanced,0.0860746701558431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,4,balanced,0.11521599690119426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,4,balanced,0.18146665891011557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,4,power_law_1.01,0.10265599489212036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,4,power_law_1.2,0.10129280090332031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,4,balanced,0.18209600448608398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,4,power_law_1.01,0.12591999769210815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,4,balanced,0.18344533443450928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,4,power_law_1.2,0.1272704005241394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,4,power_law_1.01,0.09939200282096863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,4,balanced,0.18267732858657837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,4,power_law_1.01,0.08994560241699219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,4,power_law_1.2,0.09085440039634704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,4,balanced,0.18316266934076944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,4,power_law_1.01,0.10652159452438355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,4,power_law_1.2,0.09011200070381165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,1,power_law_1.2,0.15283199548721313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,4,balanced,0.18408532937367758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,4,power_law_1.01,0.1187391996383667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,4,power_law_1.2,0.09031680226325989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,4,balanced,0.21009065707524618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,1,power_law_1.2,0.17543679475784302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,4,power_law_1.01,0.14536960124969484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,4,power_law_1.2,0.11306240558624267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,1,power_law_1.2,0.21444480419158934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,4,balanced,0.21099199851353964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,4,power_law_1.01,0.1530176043510437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,4,power_law_1.2,0.1427072048187256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,1,power_law_1.2,0.24365439414978027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,1,power_law_1.2,0.3315903902053833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,4,balanced,0.21030400196711221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,4,power_law_1.01,0.15568000078201294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,4,power_law_1.2,0.1354367971420288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,1,power_law_1.2,0.45969281196594236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,4,balanced,0.26653865973154706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,4,power_law_1.01,0.16300159692764282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,4,power_law_1.2,0.14648959636688233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,1,power_law_1.2,0.5251391887664795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,4,balanced,0.2677599986394246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,4,power_law_1.01,0.16228480339050294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,1,power_law_1.2,0.7205567836761475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,4,power_law_1.2,0.15992319583892822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,1,power_law_1.2,0.7541440010070801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,4,balanced,0.26893333594004315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,4,power_law_1.01,0.18101119995117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,4,power_law_1.2,0.17241599559783935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,1,power_law_1.2,0.7984576225280762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,4,power_law_1.01,0.1869439959526062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,4,balanced,0.5401920080184937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,4,power_law_1.2,0.18721920251846313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,1,power_law_1.2,0.867859172821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,2,balanced,0.057071998715400696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,1,power_law_1.2,0.9214847564697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,4,power_law_1.01,0.19396480321884155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,4,balanced,0.5432373285293579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,4,power_law_1.2,0.19370880126953124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,1,power_law_1.2,0.9798015594482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,4,power_law_1.01,0.2577536106109619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,4,power_law_1.2,0.20392959117889403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,2,balanced,0.06193066636721293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,1,power_law_1.2,1.0684096336364746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,4,balanced,0.5521440108617147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,4,power_law_1.01,0.2549504041671753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,4,power_law_1.2,0.2682368040084839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,1,power_law_1.2,1.175929641723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,4,balanced,0.5575840075810751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,4,power_law_1.01,0.28215680122375486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,1,power_law_1.2,1.2495936393737792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,4,power_law_1.2,0.2729919910430908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,4,balanced,0.5774453481038412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,2,balanced,0.08242666721343994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,1,power_law_1.2,1.431987190246582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,4,power_law_1.01,0.5565951824188232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,4,power_law_1.2,0.3077375888824463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,2,balanced,0.09240532914797465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,1,power_law_1.2,1.7481664657592773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,4,power_law_1.01,0.5749120235443115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,4,power_law_1.2,0.6127423763275146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,4,balanced,0.5995093186696371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,2,balanced,0.10940266648928325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,4,power_law_1.01,0.6736127853393554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,2,balanced,0.18524267276128134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,4,power_law_1.2,0.6372799873352051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.2,1.8348928451538087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,4,power_law_1.01,0.765721607208252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,2,balanced,0.1858560045560201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,4,power_law_1.2,0.7029183864593506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,4,balanced,1.1044159730275471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,2,balanced,0.18694400787353516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,4,power_law_1.01,0.8935680389404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,4,power_law_1.2,0.7853312015533447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,2,balanced,0.18677333990732828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,4,power_law_1.01,1.0885567665100098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.2,2.1487232208251954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,4,power_law_1.2,0.9765439987182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,2,balanced,0.18708266814549765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,4,balanced,1.147823969523112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.2,2.5256128311157227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,4,power_law_1.01,1.439072036743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,2,balanced,0.18799465894699097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,4,power_law_1.2,1.2344191551208497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.2,3.28430061340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,4,power_law_1.01,1.895462417602539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,2,balanced,0.18819733460744223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,4,power_law_1.2,1.560927963256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.2,3.8864959716796874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,2,balanced,0.18842132886250815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,4,power_law_1.01,2.571232032775879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,4,balanced,1.7030347188313801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,2,balanced,0.18950400749842325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,4,power_law_1.2,2.0084543228149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.2,5.310617446899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,4,power_law_1.01,3.1633344650268556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,2,balanced,0.21644800901412964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.2,6.673907470703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,4,power_law_1.2,2.7847360610961913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,2,balanced,0.21806933482487997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,4,power_law_1.01,4.049401473999024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,2,balanced,0.2198186715443929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,4,power_law_1.2,3.6993663787841795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.2,9.471250915527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,2,power_law_1.2,0.07199360132217407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,4,power_law_1.01,6.432377624511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,2,power_law_1.01,0.07182080149650574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,4,balanced,2.2512853940327964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,2,balanced,0.2841866612434387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,4,power_law_1.2,4.46550407409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,2,power_law_1.2,0.08807039856910706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.2,12.233280181884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,2,power_law_1.01,0.08958719968795777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,2,balanced,0.28701867659886676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,4,power_law_1.01,13.979743957519531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,2,power_law_1.2,0.07870720028877258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,4,power_law_1.2,6.964230346679687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,2,power_law_1.01,0.08817920088768005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,2,balanced,0.5867253144582113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,2,power_law_1.2,0.08988800048828124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,1,power_law_1.2,15.038726806640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,2,power_law_1.01,0.09160320162773132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,2,balanced,0.5928320089975992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,2,power_law_1.2,0.08568320274353028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,4,power_law_1.2,15.510214233398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,4,balanced,2.8129653930664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,2,power_law_1.01,0.09151359796524047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,2,power_law_1.2,0.10158079862594604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,2,balanced,0.6127680142720541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,1,power_law_1.2,23.563462829589845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,2,power_law_1.01,0.11699839830398559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,2,power_law_1.2,0.1462656021118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,2,balanced,0.634879986445109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,2,power_law_1.01,0.143231999874115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,2,power_law_1.2,0.14929280281066895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,2,power_law_1.01,0.15137920379638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,2,power_law_1.2,0.15199999809265136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,2,balanced,1.1777866681416829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,1,power_law_1.2,46.204550170898436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,2,power_law_1.01,0.1537600040435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,2,power_law_1.2,0.1565119981765747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,2,power_law_1.2,0.17285120487213135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,2,power_law_1.01,0.1613312005996704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,4,balanced,4.473269462585449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,2,balanced,1.2245439688364665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,2,power_law_1.2,0.18911999464035034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,2,power_law_1.01,0.1664576053619385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,2,power_law_1.2,0.1929152011871338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,2,power_law_1.01,0.17690240144729613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,2,power_law_1.2,0.21099519729614258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,2,power_law_1.01,0.18600319623947142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,2,balanced,1.8119786580403645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,2,power_law_1.2,0.22294399738311768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,2,power_law_1.01,0.20711040496826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,2,power_law_1.2,0.24488320350646972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,2,power_law_1.01,0.21244800090789795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,2,power_law_1.2,0.26777598857879636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,2,power_law_1.01,0.22958719730377197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,2,power_law_1.2,0.335699200630188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,2,power_law_1.01,0.25730559825897215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,2,balanced,2.400005340576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,2,power_law_1.01,0.3234623908996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,1,balanced,0.03301866600910822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,2,power_law_1.2,0.3828288078308105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,2,power_law_1.01,0.3558464050292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,2,power_law_1.2,0.7484288215637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,1,balanced,0.040149333576361336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,1,balanced,0.05303466816743215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,2,power_law_1.2,0.797983980178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,2,power_law_1.01,0.6856704235076905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,1,balanced,0.08227733274300893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,2,power_law_1.2,0.9590399742126465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,2,power_law_1.01,0.7671679973602294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,2,balanced,2.9923680623372397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,4,balanced,8.872175852457682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,2,power_law_1.2,1.1755135536193848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,2,power_law_1.01,0.9247615814208985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,1,balanced,0.11456533273061116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,2,power_law_1.2,1.4323455810546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,2,power_law_1.01,1.0899264335632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,1,balanced,0.18396800756454468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,2,power_law_1.2,1.7724607467651368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,1,balanced,0.1856373349825541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,2,power_law_1.01,1.3806912422180175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,2,power_law_1.2,2.4584192276000976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,1,balanced,0.18598399559656778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,2,power_law_1.01,1.752569580078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,1,balanced,0.18681599696477255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,2,power_law_1.2,3.265971374511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,2,balanced,4.751824061075847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,1,balanced,0.18609066804250082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,2,power_law_1.01,2.3907072067260744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,2,power_law_1.2,4.134291076660157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,1,balanced,0.18631466229756674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,2,power_law_1.01,3.0189888000488283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,2,power_law_1.2,6.300940704345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,1,balanced,0.1872373421986898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,2,power_law_1.01,3.5142017364501954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,2,power_law_1.2,11.699967956542968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,1,balanced,0.18766399224599203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,2,power_law_1.01,5.847686386108398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,1,balanced,0.188426673412323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,1,balanced,0.19010667006174722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,2,power_law_1.01,11.025785827636719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,1,balanced,0.1911946733792623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,1,balanced,0.1936053236325582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,1,balanced,0.22738667329152426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,1,balanced,0.23303999503453574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,2,balanced,9.439072291056315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,1,balanced,0.3121760090192159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,1,balanced,0.32309333483378094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,1,balanced,0.646074652671814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,1,balanced,0.6712000370025635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,1,balanced,1.234826644261678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,1,balanced,1.2851466337839763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,1,balanced,1.8969066937764485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,1,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,1,balanced,2.5108906428019204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,1,power_law_1.01,0.03871999979019165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,1,power_law_1.01,0.04527359902858734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,1,power_law_1.01,0.0702015995979309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,1,power_law_1.01,0.08442879915237426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,1,power_law_1.01,0.10092159509658813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,1,balanced,3.117834726969401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,1,power_law_1.01,0.13288320302963258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,1,power_law_1.2,0.03249920010566711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,1,power_law_1.01,0.13904000520706178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,1,power_law_1.01,0.1482751965522766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,1,power_law_1.2,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,1,power_law_1.01,0.1557760000228882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,1,power_law_1.2,0.04544639885425568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,1,power_law_1.01,0.1592512011528015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,1,power_law_1.2,0.06534399986267089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,1,power_law_1.01,0.1700096011161804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,1,power_law_1.2,0.08050559759140015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,1,balanced,4.946175893147786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,1,power_law_1.01,0.1811903953552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,1,power_law_1.2,0.0940671980381012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,1,power_law_1.01,0.1970752000808716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,1,power_law_1.2,0.13285759687423707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,1,power_law_1.01,0.21615359783172608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,1,power_law_1.2,0.13873280286788942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,4,balanced,0.06049066781997681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,1,power_law_1.01,0.23560960292816163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,1,power_law_1.2,0.1493824005126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,1,power_law_1.01,0.2721407890319824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,1,power_law_1.2,0.1533951997756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,4,balanced,0.06657599906126659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,1,power_law_1.01,0.28996479511260986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,1,power_law_1.2,0.16081279516220093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,1,power_law_1.2,0.16860159635543823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,1,power_law_1.01,0.3405247926712036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,4,balanced,0.07814399898052216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,1,power_law_1.2,0.1839743971824646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,1,power_law_1.01,0.4219840049743652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,1,power_law_1.2,0.20609920024871825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,1,power_law_1.01,0.48071041107177737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,1,power_law_1.01,0.903872013092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,1,power_law_1.2,0.22485759258270263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,4,balanced,0.07374399900436401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,1,power_law_1.2,0.24595839977264405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,1,power_law_1.01,1.047116756439209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,1,balanced,9.844042460123697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,1,power_law_1.2,0.2894975900650024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,1,power_law_1.01,1.3630399703979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,4,power_law_1.01,0.08568320274353028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,1,power_law_1.2,0.30621440410614015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,1,power_law_1.01,1.6561023712158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,4,balanced,0.0735040009021759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,4,power_law_1.01,0.08967040181159973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,1,power_law_1.2,0.3491391897201538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,1,power_law_1.01,2.26943359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,4,power_law_1.01,0.09570559859275818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,4,balanced,0.08098133405049641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,1,power_law_1.2,0.43654398918151854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,4,power_law_1.01,0.07614719867706299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,1,power_law_1.01,2.8916799545288088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,1,power_law_1.2,0.5100863933563232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,4,power_law_1.01,0.07191680073738098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,1,power_law_1.01,3.4828929901123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,1,power_law_1.2,0.9500991821289062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,4,power_law_1.01,0.07932800054550171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,4,balanced,0.08044266700744629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,4,power_law_1.01,0.08010240197181702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,1,power_law_1.2,1.0898495674133302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,1,power_law_1.01,5.335929489135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,4,power_law_1.01,0.08017280101776122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,4,balanced,0.08077866832415263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,1,power_law_1.2,1.397657585144043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,1,power_law_1.01,10.254854583740235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,1,power_law_1.2,1.7100543975830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,1,power_law_1.2,2.3108224868774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,1,power_law_1.2,2.9255680084228515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,4,power_law_1.01,0.10758399963378906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,4,balanced,0.09590400258700053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,4,power_law_1.01,0.10232959985733033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,1,power_law_1.2,3.5372993469238283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,4,balanced,0.0981226662794749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,4,power_law_1.2,0.08254719972610473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,4,power_law_1.01,0.11278079748153687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,4,balanced,0.09712533156077068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,2,balanced,0.056613331039746605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,4,power_law_1.2,0.09082239866256714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,1,power_law_1.2,5.368588638305664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,4,power_law_1.01,0.18279680013656616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,4,balanced,0.1773973306020101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,4,power_law_1.2,0.09864320158958435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,4,power_law_1.01,0.1843135952949524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,4,balanced,0.17646400133768717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,1,power_law_1.2,10.27088623046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,4,power_law_1.2,0.07631999850273133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,2,balanced,0.06098666787147522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,4,power_law_1.01,0.19378559589385985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,4,balanced,0.1784213383992513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,4,power_law_1.2,0.07192320227622986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,2,power_law_1.01,0.06445440053939819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,4,power_law_1.01,0.2034303903579712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,4,balanced,0.17748800913492838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,4,power_law_1.2,0.08035839796066284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,2,power_law_1.01,0.06766719818115234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,4,power_law_1.01,0.2075648069381714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,4,balanced,0.1788853406906128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,4,power_law_1.2,0.08088319897651672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,2,balanced,0.08066133161385854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,4,power_law_1.01,0.2561791896820068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,2,power_law_1.01,0.07745919823646545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,4,balanced,0.18043732643127441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,2,balanced,0.08945600191752116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,4,power_law_1.2,0.09215999841690063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,4,power_law_1.01,0.28092160224914553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,2,power_law_1.01,0.07859200239181519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,2,balanced,0.07082666456699371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,4,balanced,0.18362132708231607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,4,power_law_1.2,0.10762879848480225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,4,power_law_1.01,0.334169602394104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,2,power_law_1.01,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,2,balanced,0.0820906658967336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,4,balanced,0.186463991800944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,4,power_law_1.2,0.1055232048034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,4,power_law_1.01,0.4653952121734619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,2,power_law_1.01,0.08043519854545593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,2,balanced,0.08221333225568135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,4,power_law_1.01,0.5679359912872315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,4,power_law_1.2,0.11073280572891235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,4,balanced,0.301472008228302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,2,power_law_1.01,0.08140159845352173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,2,balanced,0.08213333288828532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,4,power_law_1.2,0.1883903980255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,4,power_law_1.01,0.8333567619323731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,2,power_law_1.01,0.0815999984741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,4,balanced,0.3068373401959737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,2,balanced,0.07691733539104462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,4,power_law_1.2,0.2022655963897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,2,power_law_1.01,0.08503040075302123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,4,power_law_1.01,1.1070783615112305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,2,balanced,0.07727999985218048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,4,balanced,0.46586132049560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,4,power_law_1.2,0.19759360551834107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,2,balanced,0.07835199932257335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,2,power_law_1.01,0.09530879855155945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,4,power_law_1.01,1.367801570892334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,4,power_law_1.2,0.2110464096069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,4,balanced,0.5851200024286906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,2,balanced,0.10807466506958008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,2,power_law_1.01,0.09242240190505982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,4,power_law_1.01,1.8677120208740234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,4,power_law_1.2,0.21684479713439941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,2,balanced,0.10943999886512756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,2,power_law_1.01,0.11427839994430541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,4,power_law_1.2,0.25550720691680906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,4,power_law_1.01,2.3481023788452147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,4,balanced,0.8613173166910807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,2,balanced,0.10986133416493733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,2,power_law_1.01,0.11207679510116578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,4,power_law_1.2,0.3058687925338745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,4,power_law_1.01,3.7031105041503904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,2,balanced,0.16849599281946817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,2,power_law_1.01,0.11843839883804322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,4,power_law_1.2,0.3726016044616699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,4,power_law_1.01,4.340256118774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,2,balanced,0.168938676516215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,4,balanced,1.1347253322601318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,4,power_law_1.2,0.5504064083099365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,2,power_law_1.01,0.21262719631195068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,2,balanced,0.17097600301106772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,4,power_law_1.2,0.6175487995147705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,2,power_law_1.01,0.20658559799194337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,4,power_law_1.01,7.322265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,2,balanced,0.17455466588338217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,4,power_law_1.2,0.9115263938903808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,2,power_law_1.01,0.22007040977478026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,4,balanced,1.68941863377889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,4,power_law_1.2,1.074028778076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,2,power_law_1.01,0.2641279935836792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,4,power_law_1.01,17.882060241699218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,2,balanced,0.1782346765200297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,4,power_law_1.2,1.8793472290039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,2,power_law_1.01,0.31923840045928953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,2,balanced,0.31947733958562213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,2,power_law_1.01,0.42237439155578616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,4,power_law_1.2,2.5072383880615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,2,balanced,0.32772799332936603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,2,power_law_1.01,0.4951807975769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,4,balanced,2.2399840354919434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,4,power_law_1.2,3.8217342376708983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,2,balanced,0.4780160188674927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,2,power_law_1.01,0.6559232234954834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,4,power_law_1.2,4.576998519897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,2,power_law_1.01,0.852012825012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,2,balanced,0.6254133383433024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,4,power_law_1.2,5.607929611206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,2,power_law_1.01,1.2018176078796388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,2,power_law_1.01,1.5283583641052245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,4,power_law_1.2,9.811532592773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,2,balanced,0.922223965326945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,4,balanced,2.7881654103597007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,2,power_law_1.01,2.0348480224609373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,4,power_law_1.2,17.116665649414063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,2,power_law_1.01,2.9460927963256838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,2,balanced,1.2165760199228923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,2,power_law_1.01,4.31512336730957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,2,power_law_1.01,6.099699020385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,2,balanced,1.8009173075358074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,2,power_law_1.01,12.734713745117187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,4,balanced,4.4402774175008135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,2,balanced,2.3876320521036782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,2,power_law_1.2,0.06654080152511596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,2,power_law_1.2,0.06607360243797303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,2,power_law_1.2,0.07760000228881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,2,balanced,2.9768800735473633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,2,power_law_1.2,0.07479040026664734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,2,power_law_1.2,0.06926079988479614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,2,power_law_1.2,0.08035839796066284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,2,power_law_1.2,0.0811456024646759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,2,power_law_1.2,0.08346880078315735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,2,power_law_1.2,0.08833919763565064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,2,power_law_1.2,0.09365760087966919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,2,power_law_1.2,0.09882879853248597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,2,power_law_1.2,0.1130944013595581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,4,balanced,8.88530158996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,2,balanced,4.7446292241414385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,2,power_law_1.2,0.11327359676361085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,2,power_law_1.2,0.1223039984703064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,2,power_law_1.2,0.2163072109222412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,2,power_law_1.2,0.2188096046447754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,2,power_law_1.2,0.23065600395202637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,2,power_law_1.2,0.2876863956451416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,2,power_law_1.2,0.3023360013961792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,2,power_law_1.2,0.39059839248657224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,2,power_law_1.2,0.5116159915924072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,1,balanced,0.03218133250872294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,2,power_law_1.2,0.6854720115661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,1,balanced,0.039621333281199135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,2,power_law_1.2,0.9380991935729981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,2,power_law_1.2,1.3695679664611817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,2,power_law_1.2,1.662451171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,1,balanced,0.051455999414126076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,2,power_law_1.2,2.6287296295166014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,1,balanced,0.07987200220425923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,2,power_law_1.2,3.3365440368652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,1,power_law_1.01,0.031052801012992858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,2,power_law_1.2,4.0817920684814455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,2,balanced,9.464848200480143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,1,balanced,0.07166400055090587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,1,power_law_1.01,0.037529599666595456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,2,power_law_1.2,7.364447784423828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,1,balanced,0.06739200154940288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,1,power_law_1.01,0.04534400105476379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,1,balanced,0.06833066542943318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,2,power_law_1.2,13.239704895019532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,1,power_law_1.01,0.05591679811477661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,1,balanced,0.07425066828727722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,1,power_law_1.01,0.07066879868507385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,1,balanced,0.07504533231258392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,1,power_law_1.01,0.06606079936027527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,1,balanced,0.07505600154399872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,1,power_law_1.01,0.07181439995765686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,1,balanced,0.07496533294518788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,1,power_law_1.01,0.07707520127296448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,1,balanced,0.0745119998852412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,1,power_law_1.01,0.07960960268974304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,1,balanced,0.07450133562088013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,1,power_law_1.01,0.08206719756126404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,1,balanced,0.07559466858704884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,1,power_law_1.01,0.09492480158805847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,1,balanced,0.10338667035102844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,1,power_law_1.01,0.0923904001712799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,1,balanced,0.10479467113812764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,1,power_law_1.01,0.10040960311889649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,1,balanced,0.1069653332233429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,1,power_law_1.01,0.10763520002365112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,1,balanced,0.17935999234517416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,1,power_law_1.01,0.11542400121688842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,1,balanced,0.18461867173512778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,1,power_law_1.01,0.1351423978805542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,1,balanced,0.3338773250579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,1,power_law_1.01,0.15124479532241822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,1,power_law_1.01,0.2601599931716919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,1,balanced,0.34397868315378827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,1,power_law_1.01,0.28935039043426514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,1,power_law_1.2,0.031667199730873105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,1,balanced,0.5044159889221191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,1,power_law_1.01,0.3707072019577026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,1,power_law_1.2,0.03814400136470795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,1,power_law_1.01,0.44339838027954104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,1,balanced,0.6607679923375448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,1,power_law_1.2,0.04492799937725067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,1,power_law_1.01,0.5877823829650879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,1,power_law_1.2,0.05358080267906189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,1,balanced,0.9710666338602701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,1,power_law_1.01,0.7474175930023194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,1,power_law_1.2,0.07061120271682739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,8,balanced,0.11924266815185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,1,power_law_1.01,1.0524864196777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,1,power_law_1.2,0.07162240147590637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,8,balanced,0.11667733391125996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,1,balanced,1.2829173405965169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,1,power_law_1.2,0.07511680126190186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,1,power_law_1.01,1.3630271911621095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,8,balanced,0.08523733417193095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,8,balanced,0.11395200093587239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,1,power_law_1.2,0.07750399708747864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,1,power_law_1.01,1.9699071884155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,8,balanced,0.11497066418329875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,8,balanced,0.08145600060621898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,1,power_law_1.2,0.07969279885292054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,1,power_law_1.01,2.587936019897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,8,balanced,0.11500266194343567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,8,balanced,0.08175466458002727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,1,balanced,1.8942933082580566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,1,power_law_1.2,0.08379520177841186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,8,balanced,0.11666133006413777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,1,power_law_1.01,3.200998306274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,8,balanced,0.08268266419569652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,1,power_law_1.2,0.09935359954833985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,8,balanced,0.11640533804893494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,8,balanced,0.08429333567619324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,1,power_law_1.01,5.03361930847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,1,power_law_1.2,0.0943615972995758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,8,balanced,0.08412266770998637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,8,balanced,0.11612266302108765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,1,power_law_1.2,0.09880959987640381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,8,balanced,0.08348266283671062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,8,balanced,0.1249066690603892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,1,power_law_1.01,9.95156478881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,1,balanced,2.508885383605957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,1,power_law_1.2,0.10581120252609252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,8,balanced,0.08684266606966655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,8,balanced,0.12599999705950418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,8,balanced,0.08726400136947632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,1,power_law_1.2,0.12227200269699097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,8,balanced,0.12626666824022928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,8,balanced,0.08699733018875122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,1,power_law_1.2,0.13752319812774658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,8,balanced,0.1301759978135427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,8,balanced,0.08673066894213359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,1,power_law_1.2,0.15107200145721436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,8,balanced,0.13120533029238382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,8,balanced,0.0864586631457011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,1,balanced,3.1179412206014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,1,power_law_1.2,0.264736008644104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,8,balanced,0.139957328637441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,8,balanced,0.08623466889063518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,1,power_law_1.2,0.29843840599060056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,8,balanced,0.14017066359519958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,8,balanced,0.0946666697661082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,1,power_law_1.2,0.369267201423645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,8,balanced,0.14196266730626425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,8,balanced,0.0981760025024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,1,power_law_1.2,0.4370431900024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,8,balanced,0.16315199931462607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,8,balanced,0.0988213320573171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,8,balanced,0.19937066237131754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,1,power_law_1.2,0.5957632064819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,8,balanced,0.1037493348121643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,8,balanced,0.20572799444198608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,8,balanced,0.13612799843152365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,1,power_law_1.2,0.744326400756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,1,balanced,4.959295908610026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,8,balanced,0.12948800126711527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,8,balanced,0.2653119961420695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,1,power_law_1.2,1.0587008476257325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,8,balanced,0.19317332903544107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,8,balanced,0.28623465696970624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,1,power_law_1.2,1.3644351959228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,8,balanced,0.07441066702206929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,8,balanced,0.1941866676012675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,8,balanced,0.4429759979248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,1,power_law_1.2,1.9647552490234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,8,balanced,0.07459199925263722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,8,balanced,0.29024000962575275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,1,power_law_1.2,2.578220748901367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,8,balanced,0.5000426769256592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,8,balanced,0.073253333568573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,8,balanced,0.329855998357137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,8,balanced,0.07638399799664815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,1,power_law_1.2,3.1803520202636717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,8,balanced,0.7443733215332031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,8,balanced,0.07763200004895528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,8,balanced,0.5160106817881266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,1,power_law_1.2,5.008819198608398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,8,balanced,0.07860800127188365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,8,balanced,0.9216427008310953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,8,balanced,0.08020266890525818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,8,balanced,0.6157493193944296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,1,power_law_1.2,9.859129333496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,8,balanced,0.07967466612656911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,8,balanced,1.3697919845581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,8,power_law_1.01,0.11549439430236816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,8,balanced,0.9019359747568766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,8,power_law_1.01,0.08064000010490417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,8,balanced,0.08217066526412964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,8,power_law_1.01,0.11847039461135864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,1,balanced,9.881216049194336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,8,power_law_1.01,0.11818879842758179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,8,balanced,0.082805335521698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,8,power_law_1.01,0.08026880025863647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,8,balanced,1.8108426729838054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,8,power_law_1.01,0.11691520214080811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,8,balanced,1.1834080219268799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,8,power_law_1.01,0.08295680284500122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,8,power_law_1.01,0.11690239906311035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,8,power_law_1.01,0.12337919473648071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,8,power_law_1.01,0.08258559703826904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,8,power_law_1.01,0.13552639484405518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,8,balanced,2.2154080073038735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,8,power_law_1.01,0.14202879667282103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,8,power_law_1.01,0.08331519961357117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,8,power_law_1.01,0.1422719955444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,8,balanced,1.4512319564819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,8,power_law_1.01,0.21801600456237794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,8,power_law_1.01,0.09317119717597962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,8,balanced,0.08339732885360718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,8,power_law_1.01,0.21799039840698242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,8,power_law_1.01,0.10001280307769775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,8,balanced,0.0843946635723114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,8,power_law_1.01,0.25763840675354005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,8,power_law_1.01,0.30716800689697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,8,power_law_1.01,0.09441919922828675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,8,balanced,0.08656533559163411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,8,balanced,3.547642707824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,8,power_law_1.01,0.21162240505218505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,8,power_law_1.01,0.10540800094604492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,8,power_law_1.01,0.2449728012084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,8,balanced,2.30894406636556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,8,balanced,0.08578667044639587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,8,power_law_1.01,0.28250880241394044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,8,power_law_1.01,0.109990394115448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,8,power_law_1.01,0.3485311985015869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,8,power_law_1.01,0.1145792007446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,8,power_law_1.01,0.5300159931182862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,8,power_law_1.01,0.13010560274124144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,8,power_law_1.01,0.6267583847045899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,8,power_law_1.01,0.9254719734191894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,8,power_law_1.01,0.13781119585037233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,8,power_law_1.01,0.8884608268737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,8,power_law_1.01,0.12643840312957763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,8,balanced,0.09682666261990865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,8,power_law_1.01,1.2214847564697267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,8,power_law_1.01,0.15882240533828734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,8,power_law_1.01,1.7982463836669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,8,balanced,0.09936533371607463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,8,power_law_1.01,0.1664255976676941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,8,balanced,7.0986989339192705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,8,power_law_1.01,2.596403121948242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,8,balanced,4.567754745483398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,8,balanced,0.10178666313489278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,8,power_law_1.01,0.19685120582580568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,8,power_law_1.01,3.5132030487060546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,8,power_law_1.01,0.27642240524291994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,8,power_law_1.01,4.777740859985352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,8,power_law_1.01,0.3811647891998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,8,power_law_1.01,7.599404907226562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,8,balanced,0.13478400309880575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,8,power_law_1.01,0.5750271797180175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,8,power_law_1.01,9.114252471923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,8,balanced,0.140773336092631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,8,power_law_1.01,0.552288007736206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,8,power_law_1.01,0.8127679824829102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,8,power_law_1.01,14.049125671386719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,8,power_law_1.01,1.0531647682189942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,8,power_law_1.01,1.490771198272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,8,power_law_1.01,29.405484008789063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,8,balanced,0.18937599658966064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,8,power_law_1.01,1.8898944854736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,8,power_law_1.01,2.7958656311035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,8,power_law_1.01,3.8955711364746093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,8,power_law_1.01,5.172832107543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,8,balanced,0.22378132740656534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,8,power_law_1.01,8.156761932373048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,8,power_law_1.01,16.872909545898438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,8,balanced,0.3547946612040202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,8,power_law_1.01,0.07332479953765869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,8,balanced,0.4277493158976237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,8,power_law_1.01,0.07304959893226623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,8,balanced,0.6345653136571249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,8,power_law_1.01,0.07426559925079346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,8,balanced,0.8330399990081787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,8,power_law_1.01,0.07653120160102844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,8,power_law_1.01,0.07760639786720276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,8,balanced,1.2299466927846272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,8,power_law_1.01,0.09262719750404358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,8,power_law_1.01,0.09644160270690919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,8,power_law_1.01,0.1095039963722229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,8,balanced,1.6448639233907063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,8,power_law_1.01,0.11719679832458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,8,power_law_1.01,0.1364799976348877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,8,balanced,2.0366080602010093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,8,power_law_1.01,0.10951679944992065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,8,power_law_1.01,0.12344959974288941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,8,power_law_1.01,0.14426239728927612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,8,balanced,3.2405761082967124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,8,power_law_1.01,0.19465600252151488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,8,power_law_1.2,0.11555839776992798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,8,power_law_1.01,0.1793727993965149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,8,power_law_1.2,0.11876480579376221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,8,power_law_1.01,0.20456960201263427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,8,power_law_1.2,0.11827199459075928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,8,power_law_1.01,0.2757440090179443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,8,power_law_1.2,0.11640959978103638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,8,power_law_1.2,0.11705600023269654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,8,power_law_1.01,0.3536895990371704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,8,balanced,6.411274592081706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,8,power_law_1.2,0.08030080199241638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,8,power_law_1.2,0.12382719516754151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,8,power_law_1.01,0.43566079139709474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,8,power_law_1.2,0.0804095983505249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,8,power_law_1.2,0.1366912007331848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,8,power_law_1.2,0.08115199804306031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,8,power_law_1.01,0.5921664237976074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,8,power_law_1.2,0.13789440393447877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,8,power_law_1.2,0.08184319734573364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,8,power_law_1.2,0.08288000226020813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,8,power_law_1.2,0.1599552035331726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,8,power_law_1.2,0.08670719861984252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,8,power_law_1.2,0.10338560342788697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,8,power_law_1.01,0.7325056076049805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,8,power_law_1.2,0.2146239995956421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,8,power_law_1.2,0.09658880233764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,8,power_law_1.2,0.10787839889526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,8,power_law_1.2,0.2256319999694824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,8,power_law_1.2,0.11502079963684082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,8,power_law_1.01,1.2832768440246582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,8,power_law_1.2,0.27409279346466064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,8,power_law_1.2,0.11461119651794434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,8,power_law_1.2,0.1385599970817566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,8,power_law_1.01,1.5575743675231934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,8,power_law_1.2,0.29149439334869387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,8,power_law_1.2,0.15025919675827026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,8,power_law_1.2,0.22389121055603028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,8,power_law_1.2,0.12602239847183228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,8,power_law_1.01,2.1516223907470704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,8,power_law_1.2,0.15780479907989503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,8,power_law_1.2,0.26524159908294676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,8,power_law_1.2,0.17534719705581664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,8,power_law_1.01,3.127673530578613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,8,power_law_1.2,0.21391360759735106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,8,power_law_1.2,0.3184000015258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,8,power_law_1.01,3.953504180908203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,8,power_law_1.2,0.2866175889968872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,8,power_law_1.2,0.3563839912414551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,8,power_law_1.2,0.35190401077270506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,8,power_law_1.2,0.5036928176879882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,8,power_law_1.01,5.593862533569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,8,power_law_1.2,0.551251220703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,8,power_law_1.2,0.6956160068511963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,8,power_law_1.2,0.5656447887420655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,4,balanced,0.07554133236408234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,8,power_law_1.2,0.7934720039367675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,8,power_law_1.01,7.150918579101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,8,power_law_1.2,1.0224703788757323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,8,power_law_1.2,1.0164095878601074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,4,balanced,0.0717439999183019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,8,power_law_1.2,0.9115200042724609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,8,power_law_1.2,1.564793586730957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,4,balanced,0.10572266578674316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,8,power_law_1.01,11.831449890136719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,8,power_law_1.2,1.9826047897338868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,8,power_law_1.2,1.3212096214294433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,8,power_law_1.2,0.07234560251235962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,4,balanced,0.10784000158309937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,8,power_law_1.2,3.1026687622070312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,8,power_law_1.2,1.8538175582885743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,8,power_law_1.2,0.07271680235862732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,8,power_law_1.2,4.184281539916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,4,balanced,0.10892800490061443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,8,power_law_1.2,2.650246429443359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,8,power_law_1.01,24.018963623046876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,8,power_law_1.2,0.07281919717788696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,8,power_law_1.2,5.254924774169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,4,balanced,0.10956799983978271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,4,balanced,0.05860800047715505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,8,power_law_1.2,3.415436935424805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,8,power_law_1.2,0.07608320116996765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,8,power_law_1.2,7.566400146484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,4,balanced,0.11247467001279195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,4,balanced,0.05609600245952606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,8,power_law_1.2,0.07701759934425353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,8,power_law_1.2,5.536851119995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,4,balanced,0.11014933387438457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,4,balanced,0.07584000130494435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,8,power_law_1.2,15.952774047851562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,8,power_law_1.2,0.09039999842643738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,4,balanced,0.11500799655914307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,4,balanced,0.07612800101439159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,8,power_law_1.2,7.676242828369141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,8,power_law_1.2,0.09940479993820191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,4,balanced,0.11486400167147319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,4,balanced,0.07607466479142506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,8,power_law_1.2,0.11175680160522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,4,balanced,0.1197760005791982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,8,power_law_1.2,9.72647705078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,4,balanced,0.07749333480993907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,4,balanced,0.0773226668437322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,4,balanced,0.12467733025550842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,8,power_law_1.2,0.11545599699020385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,8,power_law_1.2,15.363795471191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,4,balanced,0.07842133442560832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,4,balanced,0.12446932991345723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,8,power_law_1.2,0.1388864040374756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,4,balanced,0.07870933413505554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,4,balanced,0.13030399878819784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,4,balanced,0.0788800021012624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,4,balanced,0.14197867115338644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,8,power_law_1.2,29.775149536132812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,4,balanced,0.08187733093897502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,4,balanced,0.14363732933998108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,8,power_law_1.2,0.11756160259246826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,4,balanced,0.08230400085449219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,8,power_law_1.2,0.12391680479049683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,4,balanced,0.16249600052833557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,4,balanced,0.08441600203514099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,8,power_law_1.2,0.13877760171890258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,4,balanced,0.17959467569986978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,4,balanced,0.08974400162696838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,8,power_law_1.2,0.19557759761810303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,4,balanced,0.19599467515945435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,4,balanced,0.09637866417566936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,4,balanced,0.2840426762898763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,4,balanced,0.047775998711586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,4,balanced,0.09750933448473613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,4,balanced,0.28914133707682294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,8,power_law_1.2,0.1893183946609497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,4,balanced,0.04886400202910105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,4,balanced,0.1018986701965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,4,balanced,0.06752533217271169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,8,power_law_1.2,0.19333120584487914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,4,balanced,0.4192533493041992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,4,balanced,0.12034666538238525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,4,balanced,0.07072000205516815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,8,power_law_1.2,0.27296640872955324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,4,balanced,0.5323466857274374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,4,balanced,0.13750400145848593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,4,balanced,0.07130133112271626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,4,balanced,0.072543998559316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,4,balanced,0.19082132975260416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,8,power_law_1.2,0.34945919513702395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,4,balanced,0.7813226381937662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,4,balanced,0.07347733279069264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,8,power_law_1.2,0.48978562355041505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,4,balanced,0.20403200387954712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,4,balanced,0.9579839706420898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,4,balanced,0.0730453332265218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,4,balanced,0.2881706754366557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,8,power_law_1.2,0.6293824195861817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,4,balanced,0.3408000071843465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,4,balanced,1.4159146944681804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,4,balanced,0.07892266909281413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,8,power_law_1.2,0.832646369934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,4,balanced,0.07910400132338206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,4,balanced,0.49908800919850665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,4,balanced,1.842400074005127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,8,power_law_1.2,1.2427519798278808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,4,balanced,0.6389013528823853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,8,power_law_1.2,1.4564736366271973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,4,balanced,2.25654935836792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,8,power_law_1.2,2.3682815551757814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,4,balanced,0.9296480019887289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,4,balanced,0.07792533437410991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,8,power_law_1.2,3.1055360794067384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,4,balanced,0.07976533472537994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,8,power_law_1.2,4.253177642822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,4,balanced,0.08149866759777069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,4,balanced,1.228005329767863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,4,balanced,3.7066240310668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,8,power_law_1.2,6.2467201232910154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,4,balanced,0.08168533444404602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,4,power_law_1.01,0.0980288028717041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,8,power_law_1.2,7.504812622070313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,4,power_law_1.01,0.09772800207138062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,4,balanced,1.501237392425537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,4,power_law_1.01,0.09793919920921326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,8,power_law_1.2,12.120095825195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,4,power_law_1.01,0.10734080076217652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,4,power_law_1.01,0.10286719799041748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,4,balanced,0.0926026701927185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,4,power_law_1.01,0.11140480041503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,8,power_law_1.2,24.931552124023437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,4,balanced,2.440554618835449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,4,power_law_1.01,0.11664639711380005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,4,balanced,0.09512000282605489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,4,balanced,7.382368087768555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,4,power_law_1.01,0.1187391996383667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,4,balanced,0.09798933068911235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,4,power_law_1.01,0.14514559507369995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,4,balanced,0.13377599914868674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,4,power_law_1.01,0.1471935987472534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,4,balanced,0.142277330160141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,4,power_law_1.01,0.15449600219726561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,4,power_law_1.01,0.17383040189743043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,4,power_law_1.01,0.18310400247573852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,4,balanced,4.909573237101237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,4,balanced,0.19926400979359946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,4,power_law_1.01,0.18466559648513795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,4,balanced,0.24157333374023438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,4,power_law_1.01,0.20171520709991456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,4,power_law_1.01,0.20925440788269042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,4,power_law_1.01,0.25167999267578123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,4,power_law_1.01,0.3264512062072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,4,balanced,0.3701173464457194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,4,power_law_1.01,0.38584959506988525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,4,balanced,0.4806400140126546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,4,power_law_1.01,0.5973375797271728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,4,power_law_1.01,0.5803967952728272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,4,balanced,0.7394879659016927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,4,power_law_1.01,0.06424319744110107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,4,power_law_1.01,0.9260607719421386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,4,balanced,0.9869013627370199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,4,power_law_1.01,0.06700800061225891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,4,power_law_1.01,1.173344039916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,4,power_law_1.01,0.07381119728088378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,4,power_law_1.01,0.07493119835853576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,4,power_law_1.01,1.9590335845947267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,4,power_law_1.01,0.07505279779434204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,4,power_law_1.01,0.06334720253944397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,4,balanced,1.4589920043945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,4,power_law_1.01,2.5783103942871093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,4,power_law_1.01,0.07772799730300903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,4,power_law_1.01,0.06312320232391358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,4,power_law_1.01,0.09032319784164429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,4,power_law_1.01,0.08331519961357117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,4,power_law_1.01,4.158643341064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,4,power_law_1.01,0.0551360011100769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,4,power_law_1.01,0.08531200289726257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,4,balanced,1.9459360440572102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,4,power_law_1.01,0.08919039964675904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,4,power_law_1.01,0.07064319849014282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,4,power_law_1.2,0.09322239756584168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,4,power_law_1.01,4.688985443115234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,4,power_law_1.01,0.08942720293998718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,4,power_law_1.01,0.070387202501297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,4,power_law_1.01,0.09687039852142335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,4,power_law_1.2,0.07816320061683654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,4,power_law_1.01,7.324928283691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,4,power_law_1.01,0.10063999891281128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,4,power_law_1.01,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,4,power_law_1.2,0.10885119438171387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,4,power_law_1.01,0.11665920019149781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,4,balanced,2.408986727396647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,4,power_law_1.01,0.08407679796218873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,4,power_law_1.01,0.13200000524520875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,4,power_law_1.01,10.882361602783202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,4,power_law_1.2,0.10851839780807496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,4,power_law_1.01,0.13262079954147338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,4,power_law_1.01,0.09457280039787293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,4,power_law_1.2,0.10910719633102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,4,power_law_1.01,0.15104639530181885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,4,power_law_1.01,19.191436767578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,4,power_law_1.2,0.11230080127716065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,4,power_law_1.01,0.19322240352630615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,4,power_law_1.01,0.10568959712982177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,4,power_law_1.01,0.2361664056777954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,4,power_law_1.2,0.11678719520568848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,4,power_law_1.01,0.1000704050064087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,4,balanced,3.857050577799479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,4,power_law_1.01,0.3179392099380493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,4,power_law_1.2,0.1197119951248169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,4,power_law_1.01,0.40451841354370116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,4,power_law_1.01,0.6124800205230713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,4,power_law_1.2,0.1300480008125305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,4,power_law_1.01,0.88023681640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,4,power_law_1.01,0.0952127993106842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,4,power_law_1.2,0.1512895941734314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,4,power_law_1.01,1.2997119903564454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,4,power_law_1.01,0.10844800472259522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,4,power_law_1.01,1.6606527328491212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,4,power_law_1.2,0.16122879981994628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,4,power_law_1.01,0.11122560501098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,4,power_law_1.01,2.5135168075561523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,4,power_law_1.2,0.16885759830474853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,4,power_law_1.01,3.062611198425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,4,power_law_1.01,0.13660160303115845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,4,power_law_1.2,0.18211840391159057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,4,power_law_1.01,3.6619712829589846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,4,power_law_1.2,0.1963263988494873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,4,balanced,7.663002649943034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,4,power_law_1.01,5.8323009490966795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,4,power_law_1.2,0.21637120246887206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,4,power_law_1.01,0.13443200588226317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,4,power_law_1.01,12.548095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,4,power_law_1.2,0.22728960514068602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,4,power_law_1.01,0.14461439847946167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,4,power_law_1.2,0.2510335922241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,4,power_law_1.01,0.16465280055999756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,4,power_law_1.2,0.34948480129241943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,4,power_law_1.01,0.1959936022758484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,4,power_law_1.2,0.38646399974823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,4,power_law_1.01,0.34962561130523684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,4,power_law_1.2,0.6708223819732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,4,power_law_1.01,0.3608704090118408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,4,power_law_1.2,0.73854079246521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,4,power_law_1.01,0.7279295921325684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,4,power_law_1.2,1.164896011352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,4,power_law_1.2,1.2977472305297852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,4,power_law_1.01,0.8483648300170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,4,power_law_1.2,2.1254207611083986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,4,power_law_1.01,0.9370368003845215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,4,power_law_1.2,2.4111040115356444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,4,power_law_1.01,1.930169677734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,4,power_law_1.2,3.8286209106445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,4,power_law_1.01,2.3648704528808593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,4,power_law_1.2,5.7121025085449215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,4,power_law_1.01,3.386540985107422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,4,power_law_1.2,5.182092666625977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,4,power_law_1.01,5.586816024780274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,4,power_law_1.2,10.607859039306641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,4,power_law_1.01,6.220774459838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,4,power_law_1.01,10.797209930419921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,4,power_law_1.2,22.70142059326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,4,power_law_1.2,0.06844159960746765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,4,power_law_1.01,23.285459899902342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,4,power_law_1.2,0.07292159795761108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,4,power_law_1.2,0.07022719979286193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,4,power_law_1.2,0.07572479844093323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,4,power_law_1.2,0.059008002281188965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,2,balanced,0.052517334620157875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,4,power_law_1.2,0.07509120106697083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,4,power_law_1.2,0.06338559985160827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,2,balanced,0.06717333197593689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,4,power_law_1.2,0.06714879870414733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,4,power_law_1.2,0.08123520016670227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,2,balanced,0.10477866729100545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,4,power_law_1.2,0.0706816017627716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,4,power_law_1.2,0.0893119990825653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,2,balanced,0.10803199807802837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,4,power_law_1.2,0.07134079933166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,2,balanced,0.1074133316675822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,4,power_law_1.2,0.08316799998283386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,2,balanced,0.10948266585667928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,4,power_law_1.2,0.07608320116996765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,4,power_law_1.2,0.0910975992679596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,2,balanced,0.11062399546305339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,4,power_law_1.2,0.09069439768791199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,4,power_law_1.2,0.0901632010936737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,2,balanced,0.11205333471298218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,4,power_law_1.2,0.10115840435028076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,4,power_law_1.2,0.08769919872283935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,2,balanced,0.11686399579048157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,4,power_law_1.2,0.0946175992488861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,2,balanced,0.11703999837239583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,4,power_law_1.2,0.0986240029335022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,4,power_law_1.2,0.1083840012550354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,2,balanced,0.12329066793123881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,4,power_law_1.2,0.10250879526138305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,4,power_law_1.2,0.12065919637680053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,2,balanced,0.12250666817029317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,4,power_law_1.2,0.12312959432601929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,2,balanced,0.12453866998354594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,4,power_law_1.2,0.1350335955619812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,4,power_law_1.2,0.0956928014755249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,4,power_law_1.2,0.17080960273742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,2,balanced,0.12954666217168173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,4,power_law_1.2,0.10932480096817017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,4,power_law_1.2,0.24844799041748047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,2,balanced,0.1346399982770284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,4,power_law_1.2,0.10472320318222046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,2,balanced,0.13532267014185587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,4,power_law_1.2,0.1441151976585388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,4,power_law_1.2,0.27696640491485597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,2,balanced,0.16387733817100525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,4,power_law_1.2,0.3671168088912964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,2,balanced,0.17043733596801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,4,power_law_1.2,0.13932160139083863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,4,power_law_1.2,0.362009596824646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,2,balanced,0.18419732650121054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,2,balanced,0.04045866678158442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,4,power_law_1.2,0.13683199882507324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,4,power_law_1.2,0.5862207889556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,2,balanced,0.25330666700998944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,4,power_law_1.2,0.20565121173858641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,2,balanced,0.05128000179926554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,4,power_law_1.2,0.5960256099700928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,2,balanced,0.3011359969774882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,4,power_law_1.2,0.3087807893753052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,2,balanced,0.07043733199437459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,4,power_law_1.2,1.086303997039795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,4,power_law_1.2,0.28640639781951904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,2,balanced,0.42822933197021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,2,balanced,0.07294400036334991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,4,power_law_1.2,1.4374719619750977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,2,balanced,0.07467199862003326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,2,balanced,0.5151093403498331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,4,power_law_1.2,0.49868159294128417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,4,power_law_1.2,2.692083168029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,2,balanced,0.075162669022878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,4,power_law_1.2,0.6895040035247803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,4,power_law_1.2,3.2195648193359374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,2,balanced,0.7713706493377686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,2,balanced,0.07614933451016744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,4,power_law_1.2,0.9692607879638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,2,balanced,0.07625600198904674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,4,power_law_1.2,3.2202049255371095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,2,power_law_1.01,0.06257280111312866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,2,balanced,0.9852906862894694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,2,balanced,0.07674133280913036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,4,power_law_1.2,1.3377599716186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,2,power_law_1.01,0.06654080152511596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,4,power_law_1.2,6.433010864257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,2,balanced,0.07843199868996938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,4,power_law_1.2,2.151699256896973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,2,power_law_1.01,0.08432639837265014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,2,balanced,1.4574987093607585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,2,balanced,0.0795253316561381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,4,power_law_1.2,13.290386962890626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,2,power_law_1.01,0.10714880228042603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,4,power_law_1.2,2.1457408905029296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,2,balanced,0.07999999821186066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,2,power_law_1.01,0.10281599760055542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,4,power_law_1.2,3.373798370361328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,2,balanced,0.08161066472530365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,2,power_law_1.01,0.11207679510116578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,2,balanced,1.9324639638264973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,2,power_law_1.01,0.12288639545440674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,4,power_law_1.2,5.938470458984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,2,balanced,0.08611200253168742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,2,power_law_1.01,0.11980799436569214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,2,balanced,0.09417066971460979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,4,power_law_1.2,7.197907257080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,2,balanced,0.03382933388153712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,2,power_law_1.01,0.13057279586791992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,2,balanced,2.3660853703816733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,2,balanced,0.0942186713218689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,2,power_law_1.01,0.13614720106124878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,2,balanced,0.04490133126576742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,4,power_law_1.2,10.789286041259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,2,balanced,0.105813334385554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,2,balanced,0.06554133196671803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,2,power_law_1.01,0.15386879444122314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,2,balanced,0.12268799543380737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,2,balanced,0.06853866577148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,2,power_law_1.01,0.15943039655685426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,4,power_law_1.2,23.807212829589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,2,balanced,0.13286933302879333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,2,balanced,0.06997333467006683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,2,power_law_1.01,0.1617535948753357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,2,balanced,3.7869227727254233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,2,balanced,0.07031466563542683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,2,power_law_1.01,0.1801535964012146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,2,balanced,0.17598400513331094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,2,balanced,0.07205866773923238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,2,power_law_1.01,0.17807999849319459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,2,balanced,0.21572266022364298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,2,balanced,0.07208000123500824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,2,power_law_1.01,0.18082560300827027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,2,balanced,0.3032533327738444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,2,power_law_1.01,0.22498559951782227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,2,balanced,0.36267733573913574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,2,power_law_1.01,0.26696319580078126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,2,power_law_1.01,0.27205119132995603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,2,balanced,0.5302026669184366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,2,power_law_1.01,0.04648320078849792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,2,power_law_1.01,0.3875904083251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,2,balanced,0.07396799822648366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,2,balanced,7.491498947143555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,2,power_law_1.01,0.05451520085334778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,2,power_law_1.01,0.46065921783447267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,2,balanced,0.6756479740142822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,2,balanced,0.07492800056934357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,2,power_law_1.01,0.05617280006408691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,2,power_law_1.01,0.6134975910186767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,2,power_law_1.01,0.07249280214309692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,2,power_law_1.01,0.07374719977378845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,2,power_law_1.01,0.7833856105804443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,2,balanced,0.9882986545562744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,2,power_law_1.01,0.07789440155029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,2,power_law_1.01,1.233779239654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,2,power_law_1.01,0.07949439883232116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,2,power_law_1.01,0.08455039858818054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,2,power_law_1.01,1.3760767936706544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,2,power_law_1.01,0.0840511977672577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,2,balanced,1.298250675201416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,2,power_law_1.01,0.08512639999389648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,2,power_law_1.01,2.3198272705078127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,2,power_law_1.01,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,2,power_law_1.01,0.08945279717445373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,2,power_law_1.01,2.833401679992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,2,balanced,0.0782239983479182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,2,power_law_1.01,0.09267200231552124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,2,power_law_1.01,0.11622400283813476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,2,balanced,1.5909652709960938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,2,power_law_1.01,3.8484798431396485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,2,balanced,0.08021866778532664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,2,power_law_1.01,0.12163840532302857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,2,power_law_1.01,0.12237440347671509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,2,balanced,0.08292266726493835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,2,power_law_1.01,0.04286719858646393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,2,power_law_1.01,5.743635177612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,2,power_law_1.01,0.13672319650650025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,2,balanced,0.0841919978459676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,2,power_law_1.01,0.18408960103988647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,2,power_law_1.01,0.04805119931697845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,2,power_law_1.01,0.18279680013656616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,2,power_law_1.01,11.019641876220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,2,power_law_1.01,0.25547521114349364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,2,power_law_1.01,0.05482239723205566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,2,balanced,2.5249172846476235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,2,power_law_1.01,0.28387839794158937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,2,power_law_1.01,0.06958079934120179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,2,power_law_1.01,0.44812798500061035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,2,balanced,0.09594133496284485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,2,power_law_1.01,0.06955519914627076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,2,power_law_1.01,0.559980821609497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,2,balanced,0.09834133585294087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,2,power_law_1.01,0.7416255950927735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,2,power_law_1.01,0.07969279885292054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,2,power_law_1.01,0.9622400283813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,2,balanced,0.10409599542617798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,2,power_law_1.01,0.08130559921264649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,2,power_law_1.01,1.2221376419067382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,2,balanced,0.14589866995811462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,2,power_law_1.01,1.869990348815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,2,power_law_1.01,0.08710399866104127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,2,balanced,0.15589333573977152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,2,power_law_1.01,2.354419136047363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,2,power_law_1.01,3.98205451965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,2,balanced,4.966287930806478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,2,balanced,0.21618133783340454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,2,power_law_1.01,0.08470399975776673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,2,power_law_1.01,8.110438537597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,2,balanced,0.26930665969848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,2,power_law_1.01,0.0884607970714569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,2,power_law_1.01,0.0921280026435852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,2,balanced,0.42209601402282715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,2,power_law_1.01,0.0966592013835907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,2,power_law_1.01,0.09911680221557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,2,balanced,0.5746773481369019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,2,power_law_1.01,0.1057088017463684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,2,balanced,0.8501439889272054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,2,power_law_1.01,0.11790080070495605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,2,balanced,1.1194026470184326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,2,power_law_1.01,0.12815359830856324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,2,power_law_1.01,0.1492095947265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,2,balanced,1.654703934987386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,2,power_law_1.01,0.19800959825515746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,2,power_law_1.01,0.2355072021484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,2,power_law_1.01,0.33889920711517335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,2,balanced,2.1909173329671225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,2,power_law_1.01,0.4571712017059326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,2,power_law_1.01,0.6609536170959472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,2,balanced,2.721872011820475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,2,power_law_1.01,0.8428223609924317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,2,power_law_1.01,1.2609984397888183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,2,power_law_1.01,1.5160703659057617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,2,balanced,4.341093381245931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,2,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,2,power_law_1.01,2.549247932434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,2,power_law_1.2,0.07332479953765869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,2,power_law_1.01,3.548748779296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,2,power_law_1.2,0.06977919936180114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,2,power_law_1.01,4.537721633911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,2,power_law_1.2,0.10684159994125367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,2,power_law_1.2,0.10648319721221924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,2,power_law_1.01,6.672889709472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,2,power_law_1.2,0.10865919589996338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,2,power_law_1.2,0.13045120239257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,2,power_law_1.2,0.04478079974651337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,2,balanced,8.651973088582357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,2,power_law_1.01,15.010931396484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,2,power_law_1.2,0.12216960191726685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,2,power_law_1.2,0.043372800946235655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,2,power_law_1.2,0.12301440238952636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,2,power_law_1.2,0.056006401777267456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,2,power_law_1.2,0.14064639806747437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,2,power_law_1.2,0.07194240093231201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,2,power_law_1.2,0.15602560043334962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,2,power_law_1.2,0.07246080040931702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,2,power_law_1.2,0.15936000347137452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,2,power_law_1.2,0.07919999957084656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,2,power_law_1.2,0.16034560203552245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,2,power_law_1.2,0.08004480004310607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,2,power_law_1.2,0.1751871943473816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,2,power_law_1.2,0.08218880295753479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,2,power_law_1.2,0.18076800107955932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,2,power_law_1.2,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,2,power_law_1.2,0.08146560192108154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,2,power_law_1.2,0.18328959941864015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,2,power_law_1.2,0.04761599898338318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,2,power_law_1.2,0.08537600040435792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,2,power_law_1.2,0.21783039569854737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,2,power_law_1.2,0.04952319860458374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,2,power_law_1.2,0.2660032033920288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,2,power_law_1.2,0.08749439716339111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,2,power_law_1.2,0.06707839965820313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,2,power_law_1.2,0.0906112015247345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,2,power_law_1.2,0.2923840045928955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,2,power_law_1.2,0.06932479739189149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,2,power_law_1.2,0.09640960097312927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,2,power_law_1.2,0.44080638885498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,2,power_law_1.2,0.08161919713020324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,2,power_law_1.2,0.4517504215240479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,2,power_law_1.2,0.11659519672393799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,2,power_law_1.2,0.08108800053596496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,2,power_law_1.2,0.7092160224914551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,2,power_law_1.2,0.12331520318984986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,2,power_law_1.2,0.08499199748039246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,2,power_law_1.2,0.9092864036560059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,2,power_law_1.2,0.12120959758758545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,2,power_law_1.2,1.1880064010620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,2,power_law_1.2,0.12252160310745239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,2,power_law_1.2,0.08675839900970458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,2,power_law_1.2,0.17713279724121095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,2,power_law_1.2,1.6677631378173827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,2,power_law_1.2,0.09310719966888428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,2,power_law_1.2,0.1923200011253357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,2,power_law_1.2,2.2332672119140624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,1,balanced,0.048826664686203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,2,power_law_1.2,0.23527040481567382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,2,power_law_1.2,3.3994686126708986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,1,balanced,0.06711466610431671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,2,power_law_1.2,0.28665599822998045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,2,power_law_1.2,0.09249280095100403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,2,power_law_1.2,3.061939239501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,1,balanced,0.1051626702149709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,2,power_law_1.2,0.4523200035095215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,2,power_law_1.2,0.09809920191764832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,1,balanced,0.10859200358390808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,2,power_law_1.2,6.531270599365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,2,power_law_1.2,0.5455743789672851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,2,power_law_1.2,0.09608319997787476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,1,balanced,0.10847466190656026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,2,power_law_1.2,0.10983680486679077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,2,power_law_1.2,0.8126463890075684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,2,power_law_1.2,12.010848236083984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,1,balanced,0.11019733548164368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,2,power_law_1.2,0.9842047691345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,1,balanced,0.1107360025246938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,2,power_law_1.2,0.12307840585708618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,2,power_law_1.2,1.3927424430847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,1,balanced,0.11106133460998535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,2,power_law_1.2,0.1288256049156189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,1,balanced,0.03873066604137421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,2,power_law_1.2,0.15456639528274535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,1,balanced,0.11757866541544597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,2,power_law_1.2,2.130975914001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,1,balanced,0.05062933266162872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,2,power_law_1.2,0.19432320594787597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,1,balanced,0.11684266726175944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,2,power_law_1.2,2.038150405883789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,1,balanced,0.07167466481526692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,2,power_law_1.2,0.23357439041137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,1,balanced,0.11876266201337178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,1,balanced,0.07421866556008656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,2,power_law_1.2,3.954547119140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,2,power_law_1.2,0.33646080493927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,1,balanced,0.12114666899045308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,1,balanced,0.07517333328723907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,2,power_law_1.2,0.5143040180206299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,1,balanced,0.12203199664751689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,2,power_law_1.2,8.273177337646484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,1,balanced,0.07622933387756348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,1,balanced,0.1318773329257965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,2,power_law_1.2,0.7403584003448487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,1,balanced,0.07687999804814656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,1,balanced,0.1390773355960846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,2,power_law_1.2,0.8731840133666993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,1,balanced,0.07681066791216533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,1,balanced,0.03359466542800268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,1,balanced,0.13940266768137613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,1,balanced,0.07765866816043854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,2,power_law_1.2,1.5433407783508302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,1,balanced,0.04535466432571411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,1,balanced,0.16249600052833557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,1,balanced,0.06551466882228851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,1,balanced,0.07787733276685078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,2,power_law_1.2,1.7438528060913085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,1,balanced,0.18411733706792197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,1,balanced,0.0684746652841568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,1,balanced,0.07975466549396515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,1,balanced,0.07010133564472198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,2,power_law_1.2,2.392857551574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,1,balanced,0.19203199942906699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,1,balanced,0.07132799923419952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,1,balanced,0.08250133196512859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,1,balanced,0.07285333176453908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,2,power_law_1.2,3.8111873626708985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,1,balanced,0.25525333484013873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,1,balanced,0.08390399813652039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,1,balanced,0.07289066910743713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,2,power_law_1.2,4.470419311523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,1,balanced,0.3216106692949931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,1,balanced,0.09066667159398396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,1,balanced,0.09742400050163269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,1,balanced,0.4618399937947591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,2,power_law_1.2,6.287846374511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,1,balanced,0.0992746651172638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,1,balanced,0.5618773301442465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,1,balanced,0.07629866898059845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,1,balanced,0.10471999645233154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,2,power_law_1.2,14.808262634277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,1,balanced,0.0777706652879715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,1,balanced,0.1426400045553843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,1,balanced,0.8323573271433512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,1,balanced,0.14722667137781778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,1,balanced,1.075978676478068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,1,balanced,0.19489065806070963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,1,balanced,0.23972799380620322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,1,balanced,1.5860053698221843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,1,balanced,0.33961065610249835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,1,balanced,0.41597334543863934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,1,balanced,2.109007994333903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,1,balanced,0.08177066842714946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,1,power_law_1.01,0.04802559912204742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,1,balanced,0.6090133190155029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,1,balanced,0.08525333801905315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,1,balanced,0.08781333764394124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,1,power_law_1.01,0.06220800280570984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,1,balanced,0.09141332904497783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,1,balanced,2.6053013801574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,1,power_law_1.01,0.07373440265655518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,1,balanced,0.7850773334503174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,1,power_law_1.01,0.10408960580825806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,1,power_law_1.01,0.10302079916000366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,1,balanced,1.1610133647918701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,1,power_law_1.01,0.11126400232315063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,1,balanced,0.10709866881370544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,1,power_law_1.01,0.11646720170974731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,1,balanced,0.11098133524258931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,1,balanced,4.049002647399902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,1,power_law_1.01,0.11737600564956666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,1,power_law_1.01,0.039129599928855896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,1,balanced,0.11919466654459636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,1,balanced,1.5208853085835774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,1,power_law_1.01,0.11838079690933227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,1,balanced,0.16967999935150146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,1,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,1,balanced,0.18557333946228027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,1,power_law_1.01,0.12062079906463623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,1,power_law_1.01,0.04937599897384644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,1,balanced,0.2688106695810954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,1,power_law_1.01,0.12599040269851686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,1,power_law_1.01,0.0713919997215271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,1,balanced,0.35734931627909344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,1,balanced,1.8629226684570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,1,power_law_1.01,0.13460479974746703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,1,power_law_1.01,0.07266560196876526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,1,power_law_1.01,0.13523199558258056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,1,power_law_1.01,0.0760320007801056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,1,power_law_1.01,0.15639679431915282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,1,power_law_1.01,0.07631360292434693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,1,power_law_1.01,0.1803007960319519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,1,power_law_1.01,0.07562879920005798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,1,balanced,0.5394186576207479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,1,balanced,8.053850809733072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,1,balanced,2.932736078898112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,1,power_law_1.01,0.1853824019432068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,1,power_law_1.01,0.08141440153121948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,1,balanced,0.7007893721262614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,1,power_law_1.01,0.21188480854034425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,1,power_law_1.01,0.08217599987983704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,1,balanced,1.0386772950490315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,1,power_law_1.01,0.23994879722595214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,1,power_law_1.01,0.08335999846458435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,1,balanced,1.3943626085917156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,1,power_law_1.01,0.08688639998435974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,1,power_law_1.01,0.246995210647583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,1,power_law_1.01,0.0912447988986969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,1,power_law_1.01,0.30624639987945557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,1,balanced,2.0419467290242515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,1,power_law_1.01,0.11326719522476196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,1,power_law_1.01,0.3582911968231201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,1,power_law_1.01,0.48200321197509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,1,balanced,5.765077590942383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,1,power_law_1.01,0.12547839879989625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,1,balanced,2.715749422709147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,1,power_law_1.01,0.6106751918792724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,1,power_law_1.01,0.12473599910736084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,1,power_law_1.01,0.8453951835632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,1,power_law_1.01,0.12599040269851686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,1,power_law_1.01,0.1463104009628296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,1,balanced,3.3772265116373696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,1,power_law_1.01,1.0829567909240723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,1,power_law_1.01,0.1702656030654907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,1,power_law_1.01,1.6224319458007812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,1,power_law_1.01,0.21751039028167723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,1,power_law_1.01,2.1860416412353514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,1,power_law_1.01,0.24980480670928956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,1,power_law_1.01,2.7216320037841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,1,balanced,5.38148816426595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,1,power_law_1.01,0.3474623918533325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,1,power_law_1.01,4.0444286346435545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,1,power_law_1.01,0.44155521392822267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,1,power_law_1.01,0.03370240032672882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,1,power_law_1.01,8.026617431640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,1,power_law_1.01,0.6350207805633545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,1,power_law_1.01,0.03900800049304962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,1,power_law_1.01,0.787391996383667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,1,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,1,power_law_1.01,1.144761562347412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,1,power_law_1.2,0.047891199588775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,1,power_law_1.01,0.06625279784202576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,1,power_law_1.01,1.5352383613586427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,1,balanced,10.724000295003256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,1,power_law_1.2,0.0608959972858429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,1,power_law_1.01,0.06762880086898804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,1,power_law_1.01,1.9133760452270507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,1,power_law_1.2,0.0695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,1,power_law_1.01,0.07566720247268677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,1,power_law_1.01,2.944550323486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,1,power_law_1.2,0.10428800582885742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,1,power_law_1.01,0.08018559813499451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,1,power_law_1.2,0.10628479719161987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,1,power_law_1.01,5.791142272949219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,1,power_law_1.01,0.08144639730453491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,1,power_law_1.2,0.11322879791259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,1,power_law_1.2,0.11567360162734985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,1,power_law_1.01,0.08416640162467956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,1,power_law_1.2,0.11619199514389038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,1,power_law_1.01,0.08871039748191833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,1,power_law_1.2,0.11872639656066894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,1,power_law_1.2,0.12001919746398926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,1,power_law_1.01,0.09324799776077271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,1,power_law_1.2,0.12846720218658447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,1,power_law_1.01,0.09395840167999267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,1,power_law_1.2,0.13215359449386596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,1,power_law_1.2,0.13397120237350463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,1,power_law_1.01,0.09488000273704529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,1,power_law_1.2,0.038899201154708865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,1,power_law_1.2,0.1578495979309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,1,power_law_1.01,0.10786559581756591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,1,power_law_1.2,0.04497919976711273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,1,power_law_1.2,0.18056319952011107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,1,power_law_1.2,0.04809600114822388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,1,power_law_1.01,0.12023680210113526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,1,power_law_1.2,0.1797824025154114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,1,power_law_1.2,0.07162240147590637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,1,power_law_1.01,0.12693120241165162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,1,power_law_1.2,0.20315520763397216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,1,power_law_1.2,0.07399680018424988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,1,power_law_1.01,0.14686720371246337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,1,power_law_1.2,0.231660795211792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,1,power_law_1.2,0.0762112021446228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,1,power_law_1.01,0.1782271981239319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,1,power_law_1.2,0.244486403465271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,1,power_law_1.2,0.07683200240135193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.01,0.2196671962738037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,1,power_law_1.2,0.3108479976654053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,1,power_law_1.2,0.07749119997024537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.01,0.3011840105056763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,1,power_law_1.2,0.36207358837127684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,1,power_law_1.2,0.08227840065956116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.01,0.3824064016342163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,1,power_law_1.2,0.4879487991333008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,1,power_law_1.2,0.08264960050582885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,1,power_law_1.2,0.6143295764923096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,1,power_law_1.2,0.08469120264053345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.01,0.56943359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,1,power_law_1.2,0.8509504318237304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,1,power_law_1.2,0.08706560134887695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.01,0.733241605758667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,1,power_law_1.2,1.1287103652954102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,1,power_law_1.2,0.09130880236625671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.01,1.0660927772521973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,1,power_law_1.2,1.6246528625488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,1,power_law_1.2,0.10675840377807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.01,1.406719970703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,1,power_law_1.2,0.12167680263519287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,1,power_law_1.2,2.209702491760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.01,2.0695104598999023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,1,power_law_1.2,0.12276480197906495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,1,power_law_1.2,2.753228759765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,1,power_law_1.2,0.12225279808044434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.01,2.749388885498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,1,power_law_1.2,4.078086471557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,1,power_law_1.2,0.14921599626541138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,1,power_law_1.01,3.3927616119384765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,1,power_law_1.2,0.17195520401000977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,1,power_law_1.2,8.102623748779298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,1,power_law_1.2,0.2185215950012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,1,power_law_1.01,5.399801635742188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,1,power_law_1.2,0.25394558906555176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,1,power_law_1.2,0.3503871917724609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,1,power_law_1.01,10.743827056884765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,1,power_law_1.2,0.03356800079345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,1,power_law_1.2,0.4405055999755859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,1,power_law_1.2,0.037868800759315493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,1,power_law_1.2,0.6304704189300537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,1,power_law_1.2,0.047788798809051514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,1,power_law_1.2,0.7917823791503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,1,power_law_1.2,0.06828799843788147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,8,balanced,0.18184000253677368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,1,power_law_1.2,1.1457023620605469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,1,power_law_1.2,0.06715520024299622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,8,balanced,0.17252800861994425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,1,power_law_1.2,1.5570624351501465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,1,power_law_1.2,0.07585279941558838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,8,balanced,0.17254400253295898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,1,power_law_1.2,1.9250112533569337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,8,balanced,0.17148800690968832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,1,power_law_1.2,0.08000640273094177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,1,power_law_1.2,2.945952033996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,8,balanced,0.1690773367881775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,1,power_law_1.2,0.08353279829025269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,1,power_law_1.2,5.764588928222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,8,balanced,0.16932799418767294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,8,balanced,0.17011733849843344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,1,power_law_1.2,0.08439679741859436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,8,balanced,0.1742453376452128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,1,power_law_1.2,0.09051520228385926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,8,balanced,0.18119466304779053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,8,balanced,0.17857599258422852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,8,balanced,0.19365866978963217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,1,power_law_1.2,0.08924800157546997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,8,balanced,0.18434667587280273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,1,power_law_1.2,0.09193599820137024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,1,power_law_1.2,0.09573760032653808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,8,balanced,0.1819360057512919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,1,power_law_1.2,0.10968960523605346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,8,balanced,0.19233065843582153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,8,balanced,0.11390399932861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,8,balanced,0.24356265862782797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,1,power_law_1.2,0.11804800033569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,8,balanced,0.24940266211827597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,8,balanced,0.10956266522407532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,1,power_law_1.2,0.12341120243072509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,8,balanced,0.10956799983978271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,8,balanced,0.22588266928990683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,1,power_law_1.2,0.14612480401992797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,8,balanced,0.11016000310579936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,8,balanced,0.301418662071228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,1,power_law_1.2,0.18557440042495726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,8,balanced,0.11014933387438457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,8,balanced,0.25837333997090656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.2,0.22521600723266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,8,balanced,0.11029866337776184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.2,0.2977792024612427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,8,balanced,0.4457813501358032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,8,balanced,0.11040533582369487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.2,0.3848896026611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,8,power_law_1.01,0.17991679906845093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,8,balanced,0.4422186613082886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,8,balanced,0.11387200156847636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,8,balanced,0.11001066366831462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,8,power_law_1.01,0.1722815990447998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,8,balanced,0.7269386450449625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,8,balanced,0.11379200220108032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.2,0.5637824058532714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,8,power_law_1.01,0.1712767958641052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,8,balanced,0.10313066840171814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,8,balanced,0.11416000127792358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.2,0.7280128002166748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,8,balanced,0.8043946425120035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,8,power_law_1.01,0.16963839530944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,8,balanced,0.10225600004196167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,8,balanced,0.12415466705958049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.2,1.0651840209960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,8,power_law_1.01,0.16858240365982055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,8,balanced,0.10522133111953735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,8,balanced,0.11611732840538025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,8,balanced,1.2187146345774333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.2,1.3840703964233398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,8,power_law_1.01,0.1879680037498474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,8,balanced,0.107013334830602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,8,balanced,0.11642133196194966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.2,2.0658943176269533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,8,power_law_1.01,0.20977280139923096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,8,balanced,0.10831466317176819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,8,balanced,1.5139306386311848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,8,balanced,0.1275146702925364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,8,power_law_1.01,0.19587199687957763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.2,2.733260726928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,8,balanced,0.10890666643778484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,8,balanced,0.1444480021794637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,8,power_law_1.01,0.2261888027191162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,8,balanced,0.10883733630180359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,1,power_law_1.2,3.3974014282226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,8,balanced,2.4237759908040366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,8,balanced,0.14778133233388266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,8,power_law_1.01,0.2282560110092163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,1,power_law_1.2,5.389446258544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,8,balanced,0.14814933141072592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,8,power_law_1.01,0.29144959449768065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,8,balanced,0.11752000451087952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,8,balanced,0.18660267194112143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,8,power_law_1.01,0.33729279041290283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,1,power_law_1.2,10.681388854980469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,8,balanced,3.097418785095215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,8,balanced,0.11752532919247945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,8,balanced,0.17351466417312622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,8,power_law_1.01,0.3750463962554932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,8,power_law_1.01,0.4052608013153076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,8,balanced,0.2739413380622864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,8,power_law_1.01,0.4978943824768066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,8,balanced,0.28722665707270306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,8,balanced,3.8832321166992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,8,power_law_1.01,0.579641580581665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,8,balanced,0.448794682820638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,8,power_law_1.01,0.4615744113922119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,8,balanced,0.11583999792734782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,8,balanced,0.5332373380661011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,8,power_law_1.01,0.5756608009338379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,8,balanced,0.11743467052777608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,8,balanced,0.7761653264363607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,8,power_law_1.01,0.7876927852630615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,8,balanced,6.3551896413167315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,8,balanced,0.11938132842381795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,8,power_law_1.01,1.0084287643432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,8,balanced,0.12019733587900798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,8,balanced,0.9409600098927816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,8,power_law_1.01,1.429868793487549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,8,power_law_1.01,2.134592056274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,8,balanced,1.4302934010823567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,8,power_law_1.01,3.0815935134887695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,8,power_law_1.01,4.493862533569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,8,balanced,1.83515199025472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,8,balanced,0.13318399588267008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,8,balanced,0.13578133781750998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,8,power_law_1.01,0.11237119436264038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,8,power_law_1.01,6.570047760009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,8,balanced,12.474756876627604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,8,balanced,0.1400213340918223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,8,power_law_1.01,0.1047104001045227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,8,power_law_1.01,8.569625854492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,8,balanced,2.3089493115743003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,8,power_law_1.01,0.1041856050491333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,8,power_law_1.01,0.1074112057685852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,8,power_law_1.01,11.999820709228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,8,balanced,0.1850186586380005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,8,power_law_1.01,0.10771839618682862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,8,balanced,0.19275200366973877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,8,power_law_1.01,0.11697280406951904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,8,power_law_1.01,15.489132690429688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,8,balanced,3.607402801513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,8,power_law_1.01,0.1471295952796936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,8,power_law_1.01,0.1297152042388916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,8,power_law_1.01,24.146138000488282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,8,balanced,0.28087466955184937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,8,power_law_1.01,0.15821440219879152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,8,balanced,0.35069866975148517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,8,power_law_1.01,0.16323839426040648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,8,power_law_1.01,0.10871679782867431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,8,power_law_1.01,0.1378559947013855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,8,balanced,0.5452266534169515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,8,power_law_1.01,0.10198400020599366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,8,power_law_1.01,0.16298240423202515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,8,power_law_1.01,48.31678771972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,8,power_law_1.01,0.10228480100631714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,8,power_law_1.01,0.17418240308761596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,8,balanced,0.6253600120544434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,8,balanced,7.251845041910808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,8,power_law_1.01,0.10613119602203369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,8,power_law_1.2,0.16815999746322632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,8,power_law_1.01,0.21118719577789308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,8,power_law_1.01,0.10670080184936523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,8,power_law_1.2,0.172326397895813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,8,power_law_1.01,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,8,power_law_1.2,0.1708799958229065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,8,power_law_1.01,0.13201279640197755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,8,power_law_1.01,0.3061376094818115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,8,power_law_1.2,0.16951680183410645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,8,power_law_1.01,0.16082559823989867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,8,power_law_1.2,0.16815359592437745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,8,power_law_1.01,0.2941312074661255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,8,balanced,0.9629226525624593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,8,power_law_1.2,0.18663040399551392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,8,power_law_1.01,0.1774783968925476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,8,power_law_1.2,0.23033599853515624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,8,power_law_1.01,0.42441601753234864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,8,power_law_1.2,0.19861119985580444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,8,balanced,1.2202026844024658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,8,power_law_1.01,0.4437119960784912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,8,power_law_1.2,0.24270079135894776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,8,power_law_1.01,0.17246079444885254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,8,power_law_1.2,0.257094407081604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,8,power_law_1.01,0.6563392162322998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,8,power_law_1.2,0.3182015895843506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,8,power_law_1.01,0.19385600090026855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,8,power_law_1.01,0.8147711753845215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,8,power_law_1.2,0.35980160236358644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,8,balanced,1.8079840342203777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,8,power_law_1.2,0.4188543796539307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,8,power_law_1.01,1.1922944068908692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,8,power_law_1.2,0.3997056007385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,8,power_law_1.2,0.5661375999450684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,8,power_law_1.01,0.16440320014953613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,8,power_law_1.01,1.677894401550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,8,power_law_1.2,0.6186944007873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,8,balanced,2.3971306482950845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,8,power_law_1.01,0.18516479730606078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,8,power_law_1.2,0.4597760200500488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,8,power_law_1.01,2.39803524017334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,8,power_law_1.01,0.19604480266571045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,8,power_law_1.2,0.6244031906127929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,8,power_law_1.01,3.2837249755859377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,8,power_law_1.2,0.7835391998291016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,8,power_law_1.01,0.24138240814208983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,8,balanced,2.9766613642374673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,8,power_law_1.01,4.193446350097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,8,power_law_1.2,1.1591103553771973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,8,power_law_1.2,1.4204607963562013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,8,power_law_1.01,6.425376129150391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,8,power_law_1.2,2.0934463500976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,8,power_law_1.01,0.23802878856658935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,8,power_law_1.2,3.060416030883789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,8,power_law_1.01,8.0162109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,8,power_law_1.2,4.61962890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,8,power_law_1.01,0.2888704061508179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,8,balanced,4.72374947865804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,8,power_law_1.01,0.34846720695495603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,8,power_law_1.2,6.476383972167969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,8,power_law_1.01,13.853523254394531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,8,power_law_1.2,11.009619140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,8,power_law_1.01,0.4723519802093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,8,power_law_1.2,11.774899291992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,8,power_law_1.01,0.7022655963897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,8,power_law_1.01,26.937503051757812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,8,power_law_1.2,14.969395446777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,8,power_law_1.01,1.056390380859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,8,power_law_1.01,1.3556415557861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,8,power_law_1.2,25.775540161132813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,8,power_law_1.01,2.0107263565063476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,8,balanced,9.343807856241861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,8,power_law_1.01,2.345702362060547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,8,power_law_1.2,49.771609497070315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,8,power_law_1.2,0.1078976035118103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,8,power_law_1.01,3.806284713745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,8,power_law_1.2,0.10892800092697144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,8,power_law_1.01,4.226655960083008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,8,power_law_1.2,0.1072767972946167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,8,power_law_1.2,0.10920319557189942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,8,power_law_1.01,6.5504508972167965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,8,power_law_1.2,0.10913280248641968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,8,power_law_1.01,8.943679809570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,8,power_law_1.2,0.12986880540847778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,8,power_law_1.2,0.1596735954284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,8,power_law_1.01,11.392205047607423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,8,power_law_1.2,0.12604160308837892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,8,power_law_1.2,0.14005759954452515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,8,power_law_1.01,17.544985961914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,8,power_law_1.2,0.1821120023727417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,8,power_law_1.2,0.13453439474105836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,8,power_law_1.2,0.15100799798965453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,8,power_law_1.2,0.16618239879608154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,8,power_law_1.01,37.16380920410156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,8,power_law_1.2,0.21251199245452881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,8,power_law_1.2,0.24821760654449462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,8,power_law_1.2,0.2954047918319702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,8,power_law_1.2,0.10866559743881225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,8,power_law_1.2,0.30379519462585447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,8,power_law_1.2,0.10215679407119752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,8,power_law_1.2,0.44980478286743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,8,power_law_1.2,0.1023103952407837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,8,power_law_1.2,0.42552962303161623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,8,power_law_1.2,0.10599679946899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,8,power_law_1.2,0.627129602432251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,8,power_law_1.2,0.10663679838180543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,8,power_law_1.2,0.85032958984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,8,power_law_1.2,0.12895359992980956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,8,power_law_1.2,1.2951040267944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,8,power_law_1.2,0.17834880352020263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,8,power_law_1.2,1.5598272323608398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,8,power_law_1.2,0.18306560516357423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,8,power_law_1.2,2.29935359954834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,8,power_law_1.2,3.0460927963256834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,8,power_law_1.2,0.18927359580993652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,4,balanced,0.11437867085138957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,8,power_law_1.2,4.849849700927734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,4,balanced,0.0749013324578603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,8,power_law_1.2,0.19274239540100097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,4,balanced,0.09825066725413005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,4,balanced,0.07051200171311696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,8,power_law_1.2,6.746578979492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,4,balanced,0.17161067326863608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,4,balanced,0.10631466905275981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,4,balanced,0.16821332772572836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,8,power_law_1.2,7.435238647460937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,8,power_law_1.2,0.1651136040687561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,4,balanced,0.10591466228167216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,4,balanced,0.16837332646052042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,8,power_law_1.2,0.20439040660858154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,4,balanced,0.10551466544469197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,4,balanced,0.16825066010157266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,8,power_law_1.2,13.784243774414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,8,power_law_1.2,0.20545918941497804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,4,balanced,0.10664533575375874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,4,balanced,0.16856533288955688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,8,power_law_1.2,0.27774078845977784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,4,balanced,0.1687999963760376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,4,balanced,0.10691199700037639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,4,balanced,0.17626132567723593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,8,power_law_1.2,27.647967529296874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,4,balanced,0.10777599612871806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,4,balanced,0.17754133542378744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,4,balanced,0.10899200042088826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,8,power_law_1.2,0.2399679899215698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,4,balanced,0.18332266807556152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,4,balanced,0.1144426663716634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,4,balanced,0.18237332503000894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,8,power_law_1.2,0.29091839790344237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,4,balanced,0.11752000451087952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,4,balanced,0.18436266978581747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,8,power_law_1.2,0.3711872100830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,4,balanced,0.11830400427182515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,4,balanced,0.1964906652768453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,4,balanced,0.11993599931399028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,8,power_law_1.2,0.4911935806274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,4,balanced,0.2130826711654663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,4,balanced,0.1209279994169871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,4,balanced,0.2139093279838562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,8,power_law_1.2,0.6985919952392579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,4,balanced,0.1404906709988912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,4,balanced,0.2237173318862915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,4,balanced,0.14120533068974814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,8,power_law_1.2,0.9884544372558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,4,balanced,0.2754613359769185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,4,balanced,0.1384266714255015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,8,power_law_1.2,1.3577216148376465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,4,balanced,0.2629706660906474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,4,balanced,0.1691840092341105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,8,power_law_1.2,2.093587112426758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,4,balanced,0.4020800193150838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,4,balanced,0.17709332704544067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,8,power_law_1.2,2.313747215270996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,4,balanced,0.4554239908854167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,4,balanced,0.2592853307723999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,4,balanced,0.6616053183873495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,4,balanced,0.29796799023946124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,8,power_law_1.2,2.8733055114746096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,4,balanced,0.4219733476638794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,4,balanced,0.7900426387786865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,8,power_law_1.2,3.912793731689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,4,balanced,0.5113919973373413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,4,balanced,1.1997973124186199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,8,power_law_1.2,6.8924095153808596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,4,balanced,0.7592480182647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,4,balanced,0.06342400113741557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,4,balanced,1.5233759880065918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,8,power_law_1.2,9.168863677978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,4,balanced,0.06294399996598561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,4,balanced,0.9636159737904867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,4,power_law_1.01,0.1608448028564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,4,power_law_1.01,0.09872000217437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,8,power_law_1.2,9.77232666015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,4,balanced,0.09872532884279887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,4,balanced,2.285226662953695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,4,power_law_1.01,0.1370303988456726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,4,power_law_1.01,0.09807360172271729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,4,balanced,0.10070932904879253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,4,power_law_1.01,0.1571776032447815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,4,balanced,1.4279146194458008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,4,power_law_1.01,0.09896320104598999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,4,balanced,0.10219732920328777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,4,power_law_1.01,0.16815359592437745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,8,power_law_1.2,16.913343811035155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,4,power_law_1.01,0.16659200191497803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,4,power_law_1.01,0.10588799715042115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,4,balanced,0.10269332925478618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,4,balanced,3.017909367879232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,4,power_law_1.01,0.1799936056137085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,4,power_law_1.01,0.10369280576705933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,4,balanced,0.10511466860771179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,4,power_law_1.01,0.19167360067367553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,4,balanced,1.8801120122273762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,4,power_law_1.01,0.1936959981918335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,4,balanced,0.10500267148017883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,4,power_law_1.01,0.11163519620895386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,8,power_law_1.2,36.665835571289065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,4,power_law_1.01,0.20663039684295653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,4,power_law_1.01,0.21911039352416992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,4,balanced,3.7741705576578775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,4,power_law_1.01,0.12281600236892701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,4,power_law_1.01,0.23487999439239501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,4,balanced,2.318277359008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,4,power_law_1.01,0.11681920289993286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,4,power_law_1.01,0.2705215930938721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,4,power_law_1.01,0.26990718841552735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,4,power_law_1.01,0.12879999876022338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,4,power_law_1.01,0.27888638973236085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,4,balanced,0.10593600074450175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,4,power_law_1.01,0.1338752031326294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,4,power_law_1.01,0.3035583972930908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,4,balanced,0.10724799831708272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,4,power_law_1.01,0.13674880266189576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,4,power_law_1.01,0.35122559070587156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,4,balanced,6.154282887776692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,4,power_law_1.01,0.29252479076385496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,4,balanced,3.8315518697102866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,4,power_law_1.01,0.14608639478683472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,4,power_law_1.01,0.4491392135620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,4,power_law_1.01,0.14947839975357055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,4,power_law_1.01,0.5849408149719239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,4,power_law_1.01,0.08925439715385437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,4,power_law_1.01,0.7941120147705079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,4,power_law_1.01,0.17493760585784912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,4,power_law_1.01,0.0762112021446228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,4,power_law_1.01,1.2821248054504395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,4,power_law_1.01,0.21456639766693114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,4,power_law_1.01,0.08316799998283386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,4,power_law_1.01,1.4705984115600585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,4,power_law_1.01,0.2320319890975952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,4,power_law_1.01,0.1013375997543335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,4,power_law_1.01,1.8618175506591796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,4,power_law_1.01,0.2458048105239868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,4,balanced,0.11062933007876079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,4,power_law_1.01,0.10201599597930908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,4,power_law_1.01,0.3426815986633301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,4,power_law_1.01,3.2863487243652343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,4,balanced,0.1125386655330658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,4,power_law_1.01,0.12465280294418335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,4,power_law_1.01,0.3249216079711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,4,balanced,12.440831502278646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,4,balanced,7.48634147644043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,4,power_law_1.01,4.082131195068359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,4,power_law_1.01,0.13055360317230225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,4,balanced,0.11520000298817952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,4,power_law_1.01,0.49470720291137693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,4,power_law_1.01,0.1394047975540161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,4,power_law_1.01,5.910406494140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,4,balanced,0.11642133196194966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,4,power_law_1.01,0.5894400119781494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,4,power_law_1.01,0.9808896064758301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,4,power_law_1.01,8.494918060302734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,4,power_law_1.01,0.15239039659500123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,4,power_law_1.01,1.1803903579711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,4,power_law_1.01,0.15127040147781373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,4,power_law_1.01,12.985031127929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,4,power_law_1.01,1.7077247619628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,4,balanced,0.1285706659158071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,4,power_law_1.01,1.9740415573120118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,4,power_law_1.01,16.05473937988281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,4,balanced,0.13166933258374533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,4,power_law_1.01,0.1367743968963623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,4,power_law_1.01,0.145196795463562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,4,power_law_1.01,3.5368961334228515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,4,balanced,0.13687466581662497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,4,power_law_1.01,0.15253759622573854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,4,balanced,0.19291732708613077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,4,power_law_1.01,4.9158782958984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,4,power_law_1.01,0.17807999849319459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,4,power_law_1.01,31.21180114746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,4,balanced,0.20246932903925577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,4,power_law_1.01,6.009203338623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,4,power_law_1.01,0.1818560004234314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,4,power_law_1.01,0.1884608030319214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,4,balanced,0.28674133618672687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,4,power_law_1.01,8.872025299072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,4,power_law_1.01,0.26917760372161864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,4,balanced,0.37409067153930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,4,power_law_1.01,0.3741568088531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,4,power_law_1.01,21.760243225097657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,4,power_law_1.01,0.3978368043899536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,4,power_law_1.01,0.73537278175354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,4,power_law_1.01,0.9381695747375488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,4,balanced,0.5714826583862305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,4,power_law_1.01,1.207968044281006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,4,balanced,0.7550400098164877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,4,power_law_1.01,1.519200038909912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,4,balanced,1.1599679787953694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,4,power_law_1.2,0.17415679693222047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,4,power_law_1.01,2.4257856369018556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,4,power_law_1.01,4.073619079589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,4,power_law_1.2,0.1505087971687317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,4,balanced,1.5235625902811687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,4,power_law_1.01,6.801395416259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,4,power_law_1.2,0.1435968041419983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,4,power_law_1.01,7.922406768798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,4,power_law_1.2,0.1677248001098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,4,balanced,2.273599942525228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,4,power_law_1.01,7.923948669433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,4,power_law_1.2,0.16714880466461182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,4,power_law_1.2,0.18921600580215453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,4,power_law_1.01,17.818048095703126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,4,power_law_1.2,0.1928447961807251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,4,balanced,3.0080159505208335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,4,power_law_1.2,0.1919808030128479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,4,power_law_1.01,36.434906005859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,4,power_law_1.2,0.21191039085388183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,4,power_law_1.2,0.21056001186370848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,4,balanced,3.7615038553873696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,4,power_law_1.2,0.23392000198364257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,4,power_law_1.2,0.27672319412231444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,4,power_law_1.2,0.30189440250396726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,4,power_law_1.2,0.30138239860534666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,4,balanced,6.032378514607747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,4,power_law_1.2,0.3425280094146729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,4,power_law_1.2,0.3181567907333374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,4,power_law_1.2,0.4235519886016846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,4,power_law_1.2,0.4448063850402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,4,power_law_1.2,0.5399168014526368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,4,power_law_1.2,0.8825535774230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,4,power_law_1.2,0.09887359738349914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,4,power_law_1.2,1.0297856330871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,4,balanced,11.994949340820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,4,power_law_1.2,1.3215423583984376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,4,power_law_1.2,0.09905279874801635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,4,power_law_1.2,0.09127680063247681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,4,power_law_1.2,2.178783988952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,4,power_law_1.2,0.10538239479064941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,4,power_law_1.2,3.777036666870117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,4,power_law_1.2,0.10454399585723877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,4,power_law_1.2,4.8831230163574215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,4,power_law_1.2,0.1109120011329651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,4,power_law_1.2,6.973107147216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,4,power_law_1.2,0.12033280134201049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,4,power_law_1.2,0.11957759857177734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,4,power_law_1.2,7.699282836914063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,4,power_law_1.2,0.1338495969772339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,4,power_law_1.2,9.609855651855469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,4,power_law_1.2,0.13067519664764404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,4,power_law_1.2,0.13239680528640746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,4,power_law_1.2,17.351718139648437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,4,power_law_1.2,0.14712320566177367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,4,power_law_1.2,0.16161279678344725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,4,power_law_1.2,0.18557440042495726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,4,power_law_1.2,0.2137216091156006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,4,power_law_1.2,33.9984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,4,power_law_1.2,0.25095040798187257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,2,balanced,0.0710346649090449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,4,power_law_1.2,0.2453696012496948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,4,power_law_1.2,0.08883839845657349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,2,balanced,0.09775466720263164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,4,power_law_1.2,0.3555327892303467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,4,power_law_1.2,0.09098880290985108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,2,balanced,0.16402133305867514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,4,power_law_1.2,0.3268671989440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,4,power_law_1.2,0.07649919986724854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,2,balanced,0.16710400581359863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,4,power_law_1.2,0.45706877708435056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,4,power_law_1.2,0.10114560127258301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,2,balanced,0.16525333126386008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,2,balanced,0.05012799799442291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,4,power_law_1.2,0.7087679862976074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,4,power_law_1.2,0.10065280199050904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,2,balanced,0.16771199305852255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,4,power_law_1.2,0.9627455711364746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,2,balanced,0.06541866560777028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,4,power_law_1.2,0.12119040489196778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,2,balanced,0.16768532991409302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,2,balanced,0.09941866993904114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,4,power_law_1.2,1.2702655792236328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,4,power_law_1.2,0.12826240062713623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,2,balanced,0.1684160033861796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,2,balanced,0.10241599877675374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,4,power_law_1.2,2.2723392486572265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,4,power_law_1.2,0.14841599464416505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,2,balanced,0.17390400171279907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,2,balanced,0.10379733641942342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,4,power_law_1.2,2.673702430725098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,2,balanced,0.10435199737548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,2,balanced,0.17538666725158691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,4,power_law_1.2,3.843859100341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,4,power_law_1.2,0.1411967992782593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,2,balanced,0.10578667124112447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,2,balanced,0.17995200554529825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,4,power_law_1.2,6.1253822326660154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,4,power_law_1.2,0.1558784008026123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,2,balanced,0.18370133638381958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,2,balanced,0.10782399773597717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,2,balanced,0.18577067057291666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,2,balanced,0.10771200060844421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,4,power_law_1.2,7.234086608886718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,2,balanced,0.108815997838974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,2,balanced,0.1925013264020284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,4,power_law_1.2,0.14207359552383422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,4,power_law_1.2,9.184716796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,2,balanced,0.1125920017560323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,2,balanced,0.19844800233840942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,4,power_law_1.2,0.14629119634628296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,2,balanced,0.11306132872899373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,2,balanced,0.2006453275680542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,4,power_law_1.2,0.15256960391998292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,2,balanced,0.11524800459543864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,4,power_law_1.2,19.307090759277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,2,balanced,0.2456159989039103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,4,power_law_1.2,0.17844480276107788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,2,balanced,0.12251733740170796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,2,balanced,0.04496533175309499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,2,balanced,0.26841066281000775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,2,balanced,0.13121599952379862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,2,balanced,0.2818933327992757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,2,balanced,0.06076266864935557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,4,power_law_1.2,0.19696639776229857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,2,balanced,0.13343999783198038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,2,balanced,0.09610666831334432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,2,balanced,0.3803413311640422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,4,power_law_1.2,0.21971840858459474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,2,balanced,0.1569706698258718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,2,balanced,0.09914666414260864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,2,balanced,0.4396586815516154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,4,power_law_1.2,0.2858304023742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,2,balanced,0.17698667446772257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,2,balanced,0.09991466999053955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,4,power_law_1.2,0.36842238903045654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,2,balanced,0.6470239957173666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,2,balanced,0.18905067443847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,2,balanced,0.10207999746004741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,2,power_law_1.01,0.09168000221252441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,4,power_law_1.2,0.5601280212402344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,2,balanced,0.8200746377309164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,2,balanced,0.2545119921366374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,2,balanced,0.10408000151316325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,2,power_law_1.01,0.08743039965629577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,4,power_law_1.2,0.8932415962219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,2,balanced,0.2961706717809041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,2,power_law_1.01,0.11802879571914673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,2,balanced,1.1997013092041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,2,balanced,0.10325866937637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,4,power_law_1.2,1.1276864051818847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,2,power_law_1.01,0.16563839912414552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,2,balanced,0.42795733610788983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,2,power_law_1.01,0.1606592059135437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,2,power_law_1.01,0.16855039596557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,2,balanced,1.5747146606445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,4,power_law_1.2,1.8180095672607421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,2,balanced,0.5433760086695353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,2,power_law_1.01,0.1793023943901062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,2,power_law_1.01,0.17418880462646485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,4,power_law_1.2,2.2564992904663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,2,power_law_1.01,0.19026559591293335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,2,balanced,0.7852106889088949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,2,balanced,2.350671927134196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,2,balanced,0.10646933317184448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,4,power_law_1.2,3.588326263427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,2,power_law_1.01,0.21685121059417725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,2,power_law_1.01,0.21548159122467042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,2,balanced,0.10777067144711812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,2,balanced,1.0260213216145833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,4,power_law_1.2,5.461830520629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,2,power_law_1.01,0.24362239837646485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,2,power_law_1.01,0.24427518844604493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,2,balanced,3.136005401611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,4,power_law_1.2,6.333324813842774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,2,power_law_1.01,0.2397183895111084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,2,balanced,1.4992319742838542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,2,power_law_1.01,0.27983999252319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,4,power_law_1.2,9.187187194824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,2,power_law_1.01,0.28048000335693357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,2,power_law_1.01,0.3380928039550781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,2,balanced,3.8749281565348306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,2,power_law_1.01,0.4332287788391113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,4,power_law_1.2,10.423212432861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,2,balanced,2.025989373524984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,2,power_law_1.01,0.40622720718383787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,2,power_law_1.01,0.5563072204589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,2,balanced,0.11111467083295186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,2,power_law_1.01,0.6540736198425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,4,power_law_1.2,20.207437133789064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,2,balanced,0.11428800225257874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,2,power_law_1.01,0.9649663925170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,2,power_law_1.01,1.441420841217041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,2,balanced,2.4893760681152344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,2,power_law_1.01,0.0695360004901886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,2,balanced,0.11785067121187846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,2,power_law_1.01,1.8887104034423827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,2,balanced,6.139781316121419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,2,balanced,0.12006933490435283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,2,power_law_1.01,0.07677440047264099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,2,power_law_1.01,2.7626880645751952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,4,power_law_1.2,40.50550537109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,2,power_law_1.01,0.08280959725379944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,2,power_law_1.01,4.25274887084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,2,power_law_1.01,0.10130560398101807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,2,power_law_1.01,5.442323303222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,2,balanced,3.887200037638346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,2,power_law_1.01,0.10197759866714477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,2,power_law_1.01,5.477459335327149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,2,balanced,0.13542399803797403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,2,power_law_1.01,0.10737279653549195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,2,balanced,0.14036267002423605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,2,power_law_1.01,10.891289520263673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,2,power_law_1.01,0.11607680320739747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,2,balanced,0.1476693352063497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,2,power_law_1.01,0.1103935956954956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,2,power_law_1.01,19.05467529296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,2,balanced,0.20683733622233072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,2,balanced,12.617226918538412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,2,power_law_1.01,0.11722240447998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,2,balanced,0.2213546633720398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,2,power_law_1.01,0.11575039625167846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,2,power_law_1.01,0.11907199621200562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,2,balanced,7.720111846923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,2,power_law_1.01,0.13248000144958497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,2,balanced,0.3163573344548543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,2,power_law_1.01,0.12839679718017577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,2,power_law_1.01,0.154367995262146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,2,balanced,0.4230293432871501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,2,power_law_1.01,0.17424000501632692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,2,balanced,0.6454079945882162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,2,power_law_1.01,0.1740928053855896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,2,power_law_1.01,0.05676159858703613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,2,balanced,0.8538613319396973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,2,power_law_1.01,0.20515840053558348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,2,power_law_1.01,0.07067520022392274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,2,power_law_1.01,0.242905592918396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,2,power_law_1.01,0.07020800113677979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,2,balanced,1.2921600341796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,2,power_law_1.01,0.28846719264984133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,2,power_law_1.01,0.09994239807128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,2,power_law_1.01,0.3309567928314209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,2,power_law_1.01,0.10098559856414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,2,balanced,1.6939733823140461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,2,power_law_1.01,0.47535362243652346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,2,power_law_1.01,0.10911999940872193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,2,power_law_1.01,0.12177920341491699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,2,power_law_1.01,0.6357183933258057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,2,balanced,2.5203359921773276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,2,power_law_1.01,0.12479360103607177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,2,power_law_1.01,0.814412784576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,2,power_law_1.01,1.1858495712280273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,2,balanced,3.3551200230916343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,2,power_law_1.01,1.3706175804138183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,2,power_law_1.01,0.12947200536727904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,2,power_law_1.01,0.13404799699783326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,2,power_law_1.01,1.9754688262939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,2,power_law_1.01,3.165305519104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,2,balanced,4.180335998535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,2,power_law_1.01,3.8170238494873048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,2,power_law_1.01,0.1284608006477356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,2,power_law_1.01,0.1344704031944275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,2,power_law_1.01,6.4186561584472654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,2,power_law_1.01,0.14209920167922974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,2,balanced,6.689525604248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,2,power_law_1.01,12.383033752441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,2,power_law_1.01,0.15507199764251708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,2,power_law_1.2,0.09957759976387023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,2,power_law_1.2,0.10402560234069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,2,power_law_1.01,0.181113600730896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,2,power_law_1.2,0.11752320528030395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,2,power_law_1.01,0.19119999408721924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,2,power_law_1.2,0.1664191961288452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,2,power_law_1.01,0.2254784107208252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,2,power_law_1.2,0.16540160179138183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,2,power_law_1.01,0.27679359912872314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,2,power_law_1.2,0.1704319953918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,2,power_law_1.01,0.35530240535736085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,2,balanced,13.512037913004557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,2,power_law_1.2,0.18257280588150024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,2,power_law_1.01,0.551206398010254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,2,power_law_1.2,0.17799680233001708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,2,power_law_1.01,0.7453311920166016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,2,power_law_1.2,0.1865407943725586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,2,power_law_1.01,0.9927295684814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,2,power_law_1.2,0.22055039405822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,2,power_law_1.01,1.3998720169067382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,2,power_law_1.2,0.21495680809020995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,2,power_law_1.01,2.1149503707885744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,2,power_law_1.2,0.23573760986328124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,2,power_law_1.01,2.837376022338867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,2,power_law_1.2,0.24460160732269287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,2,power_law_1.2,0.25386240482330324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,2,power_law_1.01,3.4510974884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,2,power_law_1.2,0.2734463930130005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,2,power_law_1.01,5.0548351287841795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,2,power_law_1.2,0.2837631940841675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,2,power_law_1.2,0.3236736059188843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,2,power_law_1.01,5.637337493896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,2,power_law_1.2,0.4248511791229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,2,power_law_1.01,9.94949722290039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,2,power_law_1.2,0.46625919342041017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,2,power_law_1.2,0.5494143962860107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,2,power_law_1.2,0.7247744083404541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,2,power_law_1.01,17.361383056640626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,2,power_law_1.2,1.1498496055603027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,2,power_law_1.2,1.4372032165527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,2,power_law_1.2,2.0299007415771486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,2,power_law_1.2,2.361523246765137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,2,power_law_1.2,4.073376083374024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,2,power_law_1.2,0.0695039987564087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,2,power_law_1.2,4.6943103790283205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,2,power_law_1.2,0.06483839750289917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,2,power_law_1.2,0.07642239928245545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,2,power_law_1.2,6.770630645751953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,2,power_law_1.2,0.10178560018539429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,2,power_law_1.2,0.06391680240631104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,2,power_law_1.2,11.146099090576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,2,power_law_1.2,0.0998848021030426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,2,power_law_1.2,0.061504000425338747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,2,power_law_1.2,0.06588799953460693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,2,power_law_1.2,0.10557440519332886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,1,balanced,0.04994133114814758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,2,power_law_1.2,0.1007423996925354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,1,balanced,0.06804266571998596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,2,power_law_1.2,0.1148095965385437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,2,power_law_1.2,21.99321594238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,2,power_law_1.2,0.10071040391921997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,1,balanced,0.0654666672150294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,2,power_law_1.2,0.10693119764328003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,1,balanced,0.09780266880989075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,2,power_law_1.2,0.11253119707107544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,1,balanced,0.09975467125574748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,2,power_law_1.2,0.11841919422149658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,2,power_law_1.2,0.12192000150680542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,1,balanced,0.16266133387883505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,1,balanced,0.1025279959042867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,2,power_law_1.2,0.12321280241012574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,2,power_law_1.2,0.13013119697570802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,1,balanced,0.16369600097338358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,1,balanced,0.10454400380452473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,2,power_law_1.2,0.12148480415344239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,1,balanced,0.1050879955291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,1,balanced,0.16513599952061972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,1,balanced,0.10618133346239726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,2,power_law_1.2,0.1317952036857605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,1,balanced,0.10672000050544739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,1,balanced,0.16690667470296225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,2,power_law_1.2,0.12723840475082399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,2,power_law_1.2,0.13093119859695435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,1,balanced,0.10712533195813496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,2,power_law_1.2,0.13100800514221192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,1,balanced,0.1680319905281067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,1,balanced,0.1083519955476125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,2,power_law_1.2,0.15868799686431884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,1,balanced,0.16911466916402182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,1,balanced,0.11111467083295186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,2,power_law_1.2,0.16503039598464966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,1,balanced,0.11424000064531963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,1,balanced,0.1748746633529663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,1,balanced,0.11683199803034465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,2,power_law_1.2,0.1265727996826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,2,power_law_1.2,0.17896319627761842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,1,balanced,0.12576533357302347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,1,balanced,0.1758026679356893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,2,power_law_1.2,0.13727999925613404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,2,power_law_1.2,0.20417280197143556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,1,balanced,0.1341813306013743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,1,balanced,0.18153067429860434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,2,power_law_1.2,0.1409152030944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,2,power_law_1.2,0.26431999206542967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,1,balanced,0.13565867145856222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,2,power_law_1.2,0.15841920375823976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,1,balanced,0.18265599012374878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,2,power_law_1.2,0.2739264011383057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,1,balanced,0.15482667088508606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,1,balanced,0.18428266048431396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,2,power_law_1.2,0.3805311918258667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,2,power_law_1.2,0.17940479516983032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,1,balanced,0.18353599309921265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,1,balanced,0.19965332746505737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,2,power_law_1.2,0.1847808003425598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,2,power_law_1.2,0.4326015949249268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,1,balanced,0.1970240076382955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,1,balanced,0.20336000124613443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,2,power_law_1.2,0.22385919094085693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,1,balanced,0.27007466554641724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,2,power_law_1.2,0.645030403137207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,1,balanced,0.2060906688372294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,2,power_law_1.2,0.2989952087402344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,1,balanced,0.3307253321011861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,2,power_law_1.2,0.8221376419067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,1,balanced,0.24263999859491983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,2,power_law_1.2,0.3578687906265259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,1,balanced,0.47303998470306396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,2,power_law_1.2,1.310598373413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,1,balanced,0.2780906756718953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,2,power_law_1.2,0.5686016082763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,2,power_law_1.2,1.3456640243530273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,1,balanced,0.6080906788508097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,1,balanced,0.2781333327293396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,2,power_law_1.2,0.6593279838562012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,2,power_law_1.2,2.3267520904541015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,1,balanced,0.8890346686045328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,1,balanced,0.3866666555404663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,2,power_law_1.2,1.0242752075195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,2,power_law_1.2,3.061017608642578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,2,power_law_1.2,1.3021183967590333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,1,balanced,0.4757386843363444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,1,balanced,1.1598026752471924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,2,power_law_1.2,2.0473024368286135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,2,power_law_1.2,4.103187179565429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,1,balanced,0.6801013151804606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,2,power_law_1.2,2.787276840209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,2,power_law_1.2,6.273318481445313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,2,power_law_1.2,3.9533119201660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,1,balanced,1.7163039843241374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,1,balanced,0.8809920152028402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,2,power_law_1.2,6.064870452880859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,2,power_law_1.2,12.343468475341798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,1,balanced,1.2796746889750164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,2,power_law_1.2,7.858054351806641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,1,balanced,2.263322671254476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,1,balanced,0.04602666695912679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,1,balanced,1.7332372665405273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,2,power_law_1.2,11.201209259033202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,1,power_law_1.01,0.06610559821128845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,1,balanced,0.061936000982920326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,1,balanced,2.7919254302978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,1,balanced,0.09701866904894511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,2,power_law_1.2,20.97838134765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,1,power_law_1.01,0.08144000172615051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,1,balanced,2.5591467221577964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,1,balanced,0.10009066263834636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,1,power_law_1.01,0.10393600463867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,1,balanced,0.1020960013071696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,1,power_law_1.01,0.15326720476150513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,1,balanced,0.10386133193969727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,1,balanced,3.4032694498697915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,1,power_law_1.01,0.15807360410690308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,1,balanced,0.10528533657391866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,1,balanced,4.4346879323323565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,1,power_law_1.01,0.17002880573272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,1,balanced,0.10588799913724263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,1,power_law_1.01,0.17093119621276856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,1,balanced,4.219194730122884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,1,power_law_1.01,0.17464959621429443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,1,power_law_1.01,0.18666239976882934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,1,power_law_1.01,0.202508807182312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,1,balanced,0.10987200339635213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,1,power_law_1.01,0.1962623953819275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,1,balanced,0.11167466640472412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,1,power_law_1.01,0.20190720558166503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,1,balanced,6.625658671061198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,1,balanced,8.697626749674479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,1,power_law_1.01,0.21010560989379884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,1,power_law_1.01,0.2520960092544556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,1,power_law_1.01,0.04645760059356689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,1,power_law_1.01,0.256057596206665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,1,power_law_1.01,0.05372160077095032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,1,power_law_1.01,0.2593408107757568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,1,power_law_1.01,0.07221119999885559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,1,power_law_1.01,0.3236479997634888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,1,power_law_1.01,0.10001920461654663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,1,power_law_1.01,0.36798720359802245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,1,balanced,0.11758933464686076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,1,power_law_1.01,0.10162559747695923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,1,power_law_1.01,0.36180479526519777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,1,balanced,0.12261333068211873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,1,power_law_1.01,0.10607999563217163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,1,balanced,13.47479502360026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,1,power_law_1.01,0.47458558082580565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,1,balanced,0.12648533781369528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,1,power_law_1.01,0.1087231993675232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,1,power_law_1.01,0.5725312232971191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,1,power_law_1.01,0.1118399977684021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,1,balanced,0.13176533579826355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,1,power_law_1.01,0.7871039867401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,1,power_law_1.01,0.11352959871292115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,1,balanced,0.15237333377202353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,1,power_law_1.01,0.9793600082397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,1,power_law_1.01,0.11407359838485717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,1,balanced,0.15786666671435037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,1,power_law_1.01,1.3768768310546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,1,power_law_1.01,0.11822719573974609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,1,balanced,0.1696000099182129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,1,power_law_1.01,1.777984046936035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,1,power_law_1.01,0.12055039405822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,1,balanced,0.24420799811681113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,1,power_law_1.01,0.12558079957962037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,1,power_law_1.01,2.6357824325561525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,1,balanced,0.2746346592903137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,1,power_law_1.01,0.15308799743652343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,1,balanced,0.40862401326497394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,1,power_law_1.01,3.540332794189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,1,power_law_1.01,0.1596735954284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,1,balanced,0.5358080069224039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,1,power_law_1.01,4.423603057861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,1,power_law_1.01,0.16331520080566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,1,power_law_1.01,0.04431999921798706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,1,power_law_1.01,6.759033966064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,1,balanced,0.8056159814198812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,1,power_law_1.01,0.19658880233764647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,1,power_law_1.01,0.055302399396896365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,1,power_law_1.01,0.22164480686187743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,1,balanced,1.0569653511047363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,1,power_law_1.01,0.060236799716949466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,1,power_law_1.01,13.692172241210937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,1,power_law_1.01,0.2322688102722168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,1,power_law_1.01,0.0983295977115631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,1,balanced,1.5899465878804524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,1,power_law_1.01,0.3124480009078979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,1,power_law_1.01,0.09745280146598816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,1,power_law_1.01,0.3797568082809448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,1,power_law_1.01,0.10895999670028686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,1,balanced,2.0957600275675454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,1,power_law_1.01,0.5124671936035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,1,power_law_1.01,0.11501439809799194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,1,power_law_1.01,0.12485120296478272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,1,power_law_1.01,0.6511295795440674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,1,balanced,3.1208693186442056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,1,power_law_1.01,0.9324095726013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,1,power_law_1.01,1.1844672203063964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,1,power_law_1.01,0.12064640522003174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,1,balanced,4.167695999145508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,1,power_law_1.01,0.1277119994163513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,1,power_law_1.01,1.7146495819091796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,1,power_law_1.01,2.311289596557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,1,balanced,5.190026601155599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,1,power_law_1.01,0.12698880434036255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,1,power_law_1.01,2.9069055557250976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,1,power_law_1.01,0.13220479488372802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,1,power_law_1.01,4.404217529296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,1,power_law_1.01,0.13664640188217164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,1,power_law_1.01,0.15546879768371583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,1,power_law_1.01,8.70948486328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,1,balanced,8.284367879231771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,1,power_law_1.01,0.16847360134124756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,1,power_law_1.01,0.17431679964065552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,1,power_law_1.01,0.21071360111236573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,1,power_law_1.01,0.2655103921890259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.01,0.32704639434814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.01,0.4667967796325684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.01,0.5850175857543946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.01,0.8447999954223633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,1,power_law_1.2,0.06284160017967225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,1,balanced,16.588751475016277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.01,1.1030400276184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,1,power_law_1.2,0.048921599984169006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,1,power_law_1.2,0.08625919818878174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,1,power_law_1.2,0.095551997423172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.01,1.604960060119629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,1,power_law_1.2,0.15762560367584227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,1,power_law_1.2,0.055980801582336426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.01,2.1241600036621096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,1,power_law_1.2,0.16412800550460815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,1,power_law_1.2,0.07237120270729065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,1,power_law_1.2,0.16858240365982055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,1,power_law_1.2,0.17618559598922728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,1,power_law_1.2,0.09827200174331666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.01,3.149964714050293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,1,power_law_1.2,0.17734400033950806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,1,power_law_1.2,0.10236799716949463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.01,4.148460769653321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,1,power_law_1.2,0.2033535957336426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,1,power_law_1.2,0.2019200086593628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,1,power_law_1.2,0.10585600137710571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,1,power_law_1.01,5.182502365112304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,1,power_law_1.2,0.194758403301239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,1,power_law_1.2,0.11055999994277954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,1,power_law_1.2,0.19816960096359254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,1,power_law_1.2,0.2060159921646118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,1,power_law_1.2,0.1121216058731079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,1,power_law_1.01,8.267558288574218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,1,power_law_1.2,0.24165759086608887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,1,power_law_1.2,0.11313920021057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,1,power_law_1.2,0.25445759296417236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,1,power_law_1.2,0.11558400392532349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,1,power_law_1.2,0.26209919452667235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,1,power_law_1.01,16.572096252441405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,1,power_law_1.2,0.11854079961776734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,1,power_law_1.2,0.3190848112106323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,1,power_law_1.2,0.3422719955444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,1,power_law_1.2,0.12225279808044434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,1,power_law_1.2,0.34992640018463134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,1,power_law_1.2,0.1268928050994873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,1,power_law_1.2,0.46272640228271483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,1,power_law_1.2,0.5688447952270508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,1,power_law_1.2,0.14910720586776732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,1,power_law_1.2,0.7772480010986328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,1,power_law_1.2,0.16120959520339967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,1,power_law_1.2,0.9756352424621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,1,power_law_1.2,1.3826623916625977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,1,power_law_1.2,0.1625663995742798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,1,power_law_1.2,1.7803647994995118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,1,power_law_1.2,0.20495359897613524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,1,power_law_1.2,0.04523519873619079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,1,power_law_1.2,2.642201614379883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,1,power_law_1.2,0.22264959812164306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,1,power_law_1.2,0.05386880040168762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,1,power_law_1.2,3.557177734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,1,power_law_1.2,0.2400576114654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,1,power_law_1.2,0.05849599838256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,1,power_law_1.2,4.468947219848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,1,power_law_1.2,0.31233921051025393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,1,power_law_1.2,0.09957759976387023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,1,power_law_1.2,6.796403503417968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,1,power_law_1.2,0.3708159923553467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,1,power_law_1.2,0.1003648042678833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,1,power_law_1.2,13.747276306152344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,1,power_law_1.2,0.515718412399292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,1,power_law_1.2,0.11009279489517212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,1,power_law_1.2,0.6548672199249268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,1,power_law_1.2,0.11416319608688355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,1,power_law_1.2,0.12177920341491699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,1,power_law_1.2,0.9387392044067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,1,power_law_1.2,1.1973952293395995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,1,power_law_1.2,1.7157184600830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,1,power_law_1.2,0.12316800355911255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,1,power_law_1.2,2.3373952865600587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,1,power_law_1.2,0.13200639486312865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,1,power_law_1.2,2.909619140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,1,power_law_1.2,4.406342315673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,1,power_law_1.2,0.12789119482040406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,1,power_law_1.2,0.13348480463027954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,1,power_law_1.2,8.720256042480468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,1,power_law_1.2,0.13585280179977416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,1,power_law_1.2,0.15717120170593263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,1,power_law_1.2,0.169376003742218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,1,power_law_1.2,0.17611520290374755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,8,balanced,0.07237333556016286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,1,power_law_1.2,0.21157760620117189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,1,power_law_1.2,0.26698880195617675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,8,balanced,0.08118933439254761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.2,0.3309823989868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,8,balanced,0.12034666538238525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.2,0.4533247947692871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,8,balanced,0.20739734172821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.2,0.5806591987609864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,8,balanced,0.365664005279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,8,balanced,0.6916266282399496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.2,0.8272512435913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,8,balanced,0.6869440078735352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.2,1.0948351860046386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,8,balanced,0.6918666362762451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.2,1.591916847229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,8,balanced,0.6918026606241862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.2,2.117433547973633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,8,balanced,0.6944906711578369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.2,3.132736015319824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,8,balanced,0.6971253554026285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.2,4.146099090576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,8,balanced,0.69595734278361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,8,balanced,0.7018667062123617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,1,power_law_1.2,5.179334259033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,8,balanced,0.05506666501363119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,8,balanced,0.6967946688334147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,8,balanced,0.06291733185450236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,1,power_law_1.2,8.248274993896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,8,balanced,0.7057226498921713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,8,balanced,0.08232533435026805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,8,balanced,0.12820800145467123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,8,balanced,0.7093066374460856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,1,power_law_1.2,16.483743286132814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,8,balanced,0.20854934056599936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,8,balanced,0.7187999884287516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,8,balanced,0.37413867314656574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,8,balanced,0.7547039985656738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,8,balanced,0.3710826635360718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,8,balanced,0.3747466802597046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,8,balanced,0.7691199779510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,8,balanced,0.37693333625793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,8,balanced,0.3752053181330363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,8,balanced,0.7863360246022543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,8,balanced,0.37786134084065753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,8,balanced,0.3839840094248454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,8,balanced,0.8375893433888754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,8,balanced,0.3837759892145793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,8,balanced,0.3880266745885213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,8,balanced,0.8789920012156168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,8,balanced,0.39874664942423504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,8,balanced,0.40214399496714276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,8,balanced,0.9223146438598633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,8,balanced,0.4102666775385539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,8,balanced,0.4262933333714803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,8,balanced,0.44571201006571454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,8,balanced,1.2044373353322346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,8,balanced,0.47383467356363934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,8,balanced,0.05386666456858317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,8,power_law_1.01,0.2214400053024292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,8,balanced,0.06457599997520447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,8,balanced,0.5167466799418131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,8,balanced,0.08724266290664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,8,power_law_1.01,0.3599103927612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,8,balanced,1.2912373542785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,8,balanced,0.13116799791653952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,8,balanced,0.5708586772282919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,8,power_law_1.01,0.23038721084594727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,8,balanced,0.2250666618347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,8,power_law_1.01,0.2133120059967041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,8,balanced,0.3734826644261678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,8,balanced,0.3766186634699504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,8,power_law_1.01,0.2941375970840454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,8,balanced,0.6309333244959513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,8,balanced,0.37563733259836835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,8,power_law_1.01,0.4255551815032959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,8,balanced,0.3778453270594279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,8,power_law_1.01,0.5165056228637696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,8,balanced,1.7778080304463704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,8,balanced,0.3803573449452718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,8,balanced,0.8625760078430176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,8,power_law_1.01,0.5622144222259522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,8,balanced,0.3818240165710449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,8,balanced,0.3851360082626343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,8,power_law_1.01,0.5992896080017089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,8,balanced,0.38921066125233966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,8,power_law_1.01,0.5782400131225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,8,balanced,0.39140268166859943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,8,power_law_1.01,0.5864640235900879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,8,balanced,0.9706186453501383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,8,balanced,0.40195198853810626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,8,power_law_1.01,0.6314176082611084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,8,power_law_1.01,0.13313280344009398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,8,balanced,0.4068160057067871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,8,power_law_1.01,0.6419583797454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,8,balanced,2.3024266560872397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,8,power_law_1.01,0.2009216070175171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,8,balanced,0.4185119867324829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,8,power_law_1.01,0.6385280132293701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,8,power_law_1.01,0.14224640130996705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,8,power_law_1.01,0.6548992156982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,8,power_law_1.01,0.1299456000328064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,8,power_law_1.01,0.6954944133758545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,8,balanced,1.3554399808247883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,8,power_law_1.01,0.1750656008720398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,8,power_law_1.01,0.7251776218414306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,8,power_law_1.01,0.2210304021835327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,8,balanced,0.4456533193588257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,8,power_law_1.01,0.8656384468078613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,8,power_law_1.01,0.29689600467681887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,8,power_law_1.01,0.85928316116333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,8,power_law_1.01,0.303110408782959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,8,power_law_1.01,1.0360704421997071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,8,power_law_1.01,0.32157440185546876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,8,power_law_1.01,0.13612159490585327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,8,power_law_1.01,0.958790397644043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,8,balanced,2.827338536580404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,8,power_law_1.01,0.3252032041549683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,8,power_law_1.01,0.21736960411071776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,8,power_law_1.01,1.1697664260864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,8,balanced,1.751754601796468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,8,power_law_1.01,0.3055999994277954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,8,power_law_1.01,0.1369920015335083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,8,power_law_1.01,1.3398591995239257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,8,power_law_1.01,0.34041600227355956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,8,power_law_1.01,0.14280320405960084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,8,balanced,0.4737279812494914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,8,power_law_1.01,1.67825927734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,8,power_law_1.01,0.17953280210494996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,8,power_law_1.01,0.3409856081008911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,8,power_law_1.01,0.23342719078063964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,8,balanced,0.522325317064921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,8,power_law_1.01,0.36248319149017333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,8,power_law_1.01,2.268166351318359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,8,power_law_1.01,0.3026112079620361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,8,power_law_1.01,0.4031871795654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,8,power_law_1.01,2.9447168350219726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,8,power_law_1.01,0.3199039936065674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,8,balanced,0.568613330523173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,8,power_law_1.01,0.4222720146179199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,8,power_law_1.01,0.3178303956985474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,8,power_law_1.01,4.085043334960938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,8,power_law_1.01,0.4148416042327881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,8,power_law_1.01,0.3269695997238159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,8,balanced,0.713818629582723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,8,power_law_1.01,0.3456383943557739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,8,power_law_1.01,0.47704319953918456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,8,power_law_1.01,4.716012954711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,8,power_law_1.01,0.3785984039306641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,8,power_law_1.01,0.4932544231414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,8,balanced,2.1483893394470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,8,power_law_1.2,0.20817279815673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,8,power_law_1.01,0.36931838989257815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,8,power_law_1.01,0.5847040176391601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,8,power_law_1.01,7.011692810058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,8,power_law_1.01,0.4156479835510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,8,balanced,0.7936480045318604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,8,power_law_1.2,0.36190080642700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,8,power_law_1.01,0.46915202140808104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,8,power_law_1.01,0.5869247913360596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,8,power_law_1.01,0.5028927803039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,8,power_law_1.2,0.1375488042831421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,8,power_law_1.01,0.7132544040679931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,8,power_law_1.01,12.928921508789063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,8,power_law_1.01,0.5393472194671631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,8,balanced,4.490917205810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,8,power_law_1.2,0.1861631989479065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,8,power_law_1.01,0.8424192428588867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,8,balanced,1.221728006998698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,8,power_law_1.2,0.29059839248657227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,8,power_law_1.01,1.1042688369750977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,8,power_law_1.01,0.566707181930542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,8,power_law_1.2,0.32302079200744627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,8,power_law_1.01,1.417369556427002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,8,power_law_1.2,0.5199808120727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,8,power_law_1.01,1.908198356628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.01,0.5291711807250976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,8,power_law_1.2,0.5366911888122559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,8,balanced,1.404080073038737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,8,power_law_1.01,0.6457727909088135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,8,power_law_1.01,2.3849727630615236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,8,power_law_1.2,0.5294976234436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.01,0.8666048049926758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,8,power_law_1.2,0.5238976001739502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,8,power_law_1.01,3.3574337005615233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,8,power_law_1.01,1.0319040298461915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.01,1.2157567977905273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,8,power_law_1.2,0.5662784099578857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,8,power_law_1.01,4.975091171264649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,8,balanced,3.3523572285970054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,8,power_law_1.01,1.7273151397705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,8,power_law_1.2,0.6022528171539306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.01,2.1216064453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,8,balanced,2.064730644226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,8,power_law_1.2,0.6428736209869385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,8,power_law_1.01,8.917171478271484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,8,power_law_1.01,3.19048957824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,8,power_law_1.2,0.6685247898101807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.01,3.7152126312255858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,8,power_law_1.2,0.6822527885437012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,8,power_law_1.01,4.987551879882813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,8,power_law_1.2,0.739251184463501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,8,power_law_1.01,7.474214172363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,8,power_law_1.2,0.7962944030761718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,8,power_law_1.2,0.8912768363952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,8,balanced,2.7250452041625977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,8,power_law_1.01,15.57587127685547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,8,power_law_1.2,0.9251392364501954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,8,power_law_1.2,0.13284480571746826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,8,power_law_1.2,1.2225536346435546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,8,power_law_1.2,0.20039041042327882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,8,power_law_1.2,1.0791680335998535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,8,power_law_1.2,0.09315840005874634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,8,power_law_1.2,1.270464038848877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,8,power_law_1.2,0.13100800514221192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,8,power_law_1.2,1.4017855644226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,8,power_law_1.2,0.1535104036331177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,8,power_law_1.2,1.9680831909179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,8,power_law_1.2,0.21672959327697755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,8,power_law_1.2,2.4976959228515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,8,power_law_1.2,0.29173760414123534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,8,balanced,8.658896128336588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,8,balanced,3.3902079264322915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,8,power_law_1.2,3.413747024536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,8,power_law_1.2,0.29087998867034914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,8,power_law_1.2,0.30138239860534666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,8,power_law_1.2,4.211513519287109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,8,power_law_1.2,0.32457599639892576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,8,power_law_1.2,0.3257152080535889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,8,power_law_1.2,6.360371017456055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,8,power_law_1.2,0.33909759521484373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,8,power_law_1.2,0.32666239738464353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,8,power_law_1.2,9.340070343017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,8,power_law_1.2,0.37725439071655276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,8,power_law_1.2,0.43994879722595215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,8,power_law_1.2,0.43848958015441897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,8,power_law_1.2,0.4467904090881348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,8,balanced,6.627882639567058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,8,power_law_1.2,17.506381225585937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,8,power_law_1.2,0.5120575904846192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,8,power_law_1.2,0.5186431884765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,8,power_law_1.2,0.6082176208496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,8,power_law_1.2,0.6158207893371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,8,power_law_1.2,0.7668159961700439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,8,balanced,5.387125651041667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,8,power_law_1.2,0.9159808158874512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,8,power_law_1.2,1.2267392158508301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,8,power_law_1.2,1.5318528175354005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,8,power_law_1.2,2.167161560058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,8,power_law_1.2,2.9641088485717773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,8,power_law_1.2,3.7920257568359377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,8,power_law_1.2,5.588467025756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,8,power_law_1.2,11.83157730102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,8,balanced,10.985098520914713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,8,power_law_1.2,0.14351359605789185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,8,power_law_1.2,0.21353600025177003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,4,balanced,0.06668266654014587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,8,power_law_1.2,0.08909440040588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,4,balanced,0.08142933249473572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,8,power_law_1.2,0.11941759586334229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,4,balanced,0.12151466806729634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,8,power_law_1.2,0.16796799898147582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,4,balanced,0.20900267362594604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,8,power_law_1.2,0.22234880924224854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,4,balanced,0.36925868193308514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,8,power_law_1.2,0.29342079162597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,4,balanced,0.6909973621368408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,4,balanced,0.053029333551724754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,8,power_law_1.2,0.2937855958938599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,4,balanced,0.6917866865793864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,4,balanced,0.06294933458169301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,4,balanced,0.69706130027771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,8,power_law_1.2,0.30693759918212893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,4,balanced,0.08423466483751933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,4,balanced,0.6990506649017334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,8,power_law_1.2,0.30580480098724366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,4,balanced,0.13051199913024902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,4,balanced,0.7048266728719076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,8,power_law_1.2,0.3532160043716431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,4,balanced,0.20902933677037558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,4,balanced,0.6967360178629557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,8,power_law_1.2,0.3547967910766602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,4,balanced,0.3720586697260539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,4,balanced,0.7021493117014567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,8,power_law_1.2,0.39946880340576174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,4,balanced,0.3740853468577067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,4,balanced,0.7037920157114664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,4,balanced,0.3826613426208496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,8,power_law_1.2,0.4224639892578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,4,balanced,0.3800373474756877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,4,balanced,0.7105120023091634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,8,power_law_1.2,0.45674881935119627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,4,balanced,0.38255465030670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,4,balanced,0.7194506327311198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,8,power_law_1.2,0.49947519302368165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,4,balanced,0.3866080045700073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,4,balanced,0.7237706979115804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,8,power_law_1.2,0.551148796081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,4,balanced,0.39347732067108154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,4,balanced,0.3959519863128662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,4,balanced,0.7300960222880045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,4,balanced,0.39665067195892334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,4,balanced,0.7707093556722006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,8,power_law_1.2,0.6137983798980713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,4,balanced,0.40563734372456867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,4,balanced,0.78875732421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,4,balanced,0.41160531838734943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,4,balanced,0.06301333506902058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,4,balanced,0.42107200622558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.2,0.5986495971679687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,4,balanced,0.8166506290435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,4,balanced,0.44064001242319745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,4,balanced,0.07141333321730296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,8,power_law_1.2,0.7321343898773194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,4,balanced,0.09337066610654195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,4,balanced,0.47678931554158527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,4,balanced,0.8773653507232666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.2,0.9558143615722656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,4,balanced,0.14335466424624124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,4,balanced,0.5199626684188843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,8,power_law_1.2,1.076313591003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,4,balanced,0.21617066860198975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,4,balanced,0.9493119716644287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,4,balanced,0.3808533350626628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.2,1.405344009399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,4,balanced,0.5571893453598022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,4,balanced,0.38202667236328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,8,power_law_1.2,1.9124479293823242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,4,balanced,0.38395198186238605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,4,power_law_1.01,0.0870848000049591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,4,balanced,1.012778679529826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,4,power_law_1.01,0.13137279748916625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,4,balanced,0.6406240065892538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,4,balanced,0.3880693515141805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.2,2.688115119934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,4,power_law_1.01,0.19911680221557618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,4,power_law_1.01,0.12223999500274658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,4,balanced,0.3910293181737264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,8,power_law_1.2,3.7530113220214845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,4,power_law_1.01,0.07341439723968506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,4,power_law_1.01,0.1260480046272278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,4,balanced,0.7183307011922201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,4,balanced,0.39306668440500897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,4,balanced,1.3364799817403157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,4,power_law_1.01,0.18533120155334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,4,power_law_1.01,0.11510399580001832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.2,5.083366394042969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,4,balanced,0.3975359996159871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,4,power_law_1.01,0.2846719980239868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,4,power_law_1.01,0.1691648006439209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,4,balanced,0.401962677637736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,8,power_law_1.2,6.355961608886719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,4,balanced,0.41195201873779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,4,balanced,0.9709973335266113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,4,power_law_1.01,0.3733695983886719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,4,power_law_1.01,0.2198335886001587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,4,power_law_1.01,0.49482879638671873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,4,balanced,0.4254666566848755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,4,power_law_1.01,0.2751744031906128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,8,power_law_1.2,10.075885009765624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,4,balanced,1.456666628519694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,4,power_law_1.01,0.09839360117912292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,4,power_law_1.01,0.531276798248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,4,balanced,0.43192001183827716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,4,power_law_1.01,0.2927808046340942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,4,power_law_1.01,0.14191999435424804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,4,power_law_1.01,0.5458176136016846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,4,balanced,0.44728533426920575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,4,power_law_1.01,0.29454081058502196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,4,balanced,1.1309386889139812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,4,power_law_1.01,0.11195520162582398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,8,power_law_1.2,22.477830505371095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,4,power_law_1.01,0.5498496055603027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,4,power_law_1.01,0.30524160861968996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,4,power_law_1.01,0.12108800411224366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,4,power_law_1.01,0.5901120185852051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,4,power_law_1.01,0.1723199963569641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,4,power_law_1.01,0.3211456060409546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,4,power_law_1.01,0.2097343921661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,4,power_law_1.01,0.6372159957885742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,4,balanced,1.9967145919799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,4,power_law_1.01,0.33333120346069334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,4,power_law_1.01,0.2955647945404053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,4,power_law_1.01,0.6404863834381104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,4,balanced,0.49305065472920734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,4,power_law_1.01,0.30967040061950685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,4,power_law_1.01,0.34993278980255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,4,power_law_1.01,0.3183039903640747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,4,power_law_1.01,0.6365952014923095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,4,balanced,1.6093920071919758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,4,power_law_1.01,0.3254463911056519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,4,power_law_1.01,0.3767551898956299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,4,power_law_1.01,0.6477439880371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,4,power_law_1.01,0.3555392026901245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,4,power_law_1.01,0.408735990524292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,4,power_law_1.01,0.36504321098327636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,4,power_law_1.01,0.666431999206543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,4,power_law_1.01,0.43169279098510743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,4,power_law_1.01,0.3846400022506714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,4,power_law_1.01,0.7465983867645264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,4,power_law_1.01,0.4116223812103271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,4,power_law_1.01,0.4211775779724121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,4,power_law_1.01,0.4455552101135254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,4,power_law_1.01,0.7773248195648194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,4,balanced,2.618618647257487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,4,power_law_1.01,0.48236799240112305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,4,power_law_1.01,0.48441600799560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,4,balanced,0.5497066577275594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,4,power_law_1.01,0.5560128211975097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,4,power_law_1.01,0.8671232223510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,4,power_law_1.01,0.5006400108337402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,4,balanced,2.092485268910726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,4,balanced,0.6416426499684652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,4,power_law_1.01,1.0008447647094727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,4,power_law_1.01,0.5722943782806397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,4,power_law_1.01,0.616096019744873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,4,power_law_1.01,0.6099584102630615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,4,power_law_1.01,1.008902359008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,4,balanced,0.7002240022023519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,4,power_law_1.01,0.7687808036804199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,4,power_law_1.01,1.1658944129943847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,4,power_law_1.2,0.13029760122299194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,4,power_law_1.01,0.6253312110900879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,4,power_law_1.01,1.3301376342773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,4,power_law_1.01,0.9167424201965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,4,balanced,0.9131413300832113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,4,power_law_1.01,0.7817408084869385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,4,power_law_1.2,0.20031359195709228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,4,power_law_1.01,1.6716543197631837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,4,power_law_1.01,1.2090432167053222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,4,power_law_1.01,0.9269184112548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,4,power_law_1.2,0.11087360382080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,4,power_law_1.01,2.2503679275512694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,4,power_law_1.01,1.1255743980407715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,4,power_law_1.01,1.3935359954833983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,4,balanced,1.056821346282959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,4,balanced,3.2612053553263345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,4,power_law_1.2,0.18312959671020507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,4,power_law_1.01,1.454918384552002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,4,power_law_1.01,2.757676887512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,4,power_law_1.01,2.0622400283813476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,4,balanced,2.554426670074463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,4,power_law_1.2,0.2526592016220093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,4,power_law_1.01,1.9465215682983399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,4,power_law_1.01,2.6154943466186524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,4,power_law_1.01,3.5927360534667967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,4,power_law_1.01,2.532032012939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,4,power_law_1.2,0.30443520545959474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,4,balanced,1.6313707033793132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,4,power_law_1.01,3.7056705474853517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,4,power_law_1.2,0.47907199859619143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,4,power_law_1.01,4.285580825805664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,4,power_law_1.01,3.139865684509277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,4,power_law_1.2,0.5238783836364747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,4,power_law_1.01,4.496992111206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,4,power_law_1.2,0.5513088226318359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,4,power_law_1.01,4.855583953857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,4,power_law_1.01,6.54163818359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,4,power_law_1.01,5.874860763549805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,4,power_law_1.2,0.549292802810669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,4,balanced,1.9238773981730144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,4,power_law_1.01,9.372806549072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,4,power_law_1.2,0.5792768001556396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,4,power_law_1.01,9.848544311523437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,4,power_law_1.01,14.250810241699218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,4,power_law_1.2,0.6101952075958252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,4,power_law_1.2,0.6500991821289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,4,power_law_1.01,19.46972198486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,4,power_law_1.2,0.6567039966583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,4,power_law_1.2,0.6960639953613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,4,balanced,5.0913387934366865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,4,balanced,2.85041077931722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,4,power_law_1.2,0.7249472141265869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,4,balanced,4.0782772699991865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,4,power_law_1.2,0.7542335987091064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,4,power_law_1.2,0.8522496223449707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,4,power_law_1.2,0.8931584358215332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,4,power_law_1.2,1.0318592071533204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,4,power_law_1.2,1.0168959617614746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,4,balanced,3.746906598409017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,4,power_law_1.2,1.1916543960571289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,4,power_law_1.2,1.4949440002441405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,4,power_law_1.2,1.7844671249389648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,4,power_law_1.2,2.249350357055664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,4,power_law_1.2,3.1153728485107424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,4,power_law_1.2,4.387360000610352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,4,power_law_1.2,4.910726547241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,4,balanced,4.647760073343913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,4,power_law_1.2,7.8476097106933596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,4,power_law_1.2,17.51640930175781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,4,balanced,8.039567947387695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,4,balanced,10.304741541544596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,4,balanced,7.410101572672526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,4,power_law_1.2,0.08638719916343689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,4,power_law_1.2,0.1184000015258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,4,power_law_1.2,0.07970560193061829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,4,power_law_1.2,0.10881279706954956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,4,power_law_1.2,0.1477247953414917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,4,power_law_1.2,0.19045759439468385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,4,power_law_1.2,0.27056639194488524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,4,power_law_1.2,0.29049599170684814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,4,power_law_1.2,0.3116031885147095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,4,power_law_1.2,0.3168960094451904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,4,power_law_1.2,0.31763200759887694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,4,balanced,14.983509063720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,4,power_law_1.2,0.3356735944747925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,4,power_law_1.2,0.3561088085174561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,4,power_law_1.2,0.38927359580993653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,4,power_law_1.2,0.40364799499511717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,4,power_law_1.2,0.457919979095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,4,power_law_1.2,0.43459200859069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,4,power_law_1.2,0.5139647960662842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,4,power_law_1.2,0.499238395690918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,4,power_law_1.2,0.6165311813354493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,4,power_law_1.2,0.6501696109771729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,4,power_law_1.2,0.8065088272094727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,4,power_law_1.2,0.9477631568908691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,4,power_law_1.2,1.348953628540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,4,power_law_1.2,1.6069631576538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,2,balanced,0.07014399766921997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,4,power_law_1.2,2.3023168563842775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,2,balanced,0.054058666030565895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,2,balanced,0.08293333152929942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,2,balanced,0.12271466851234436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,4,power_law_1.2,2.7084863662719725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,2,balanced,0.06537599861621857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,2,balanced,0.20599999030431113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,2,balanced,0.08745066324869792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,4,power_law_1.2,3.5738624572753905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,2,balanced,0.37297598520914715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,2,balanced,0.13699733217557272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,4,power_law_1.2,0.09843840003013611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,2,balanced,0.7006613413492838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,2,balanced,0.22242132822672525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,4,power_law_1.2,5.539174270629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,2,balanced,0.7085333665211996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,4,power_law_1.2,0.14209920167922974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,2,balanced,0.3877013524373372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,2,balanced,0.7050453027089437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,4,power_law_1.2,0.08305280208587647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,2,balanced,0.3885600169499715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,4,power_law_1.2,10.951789093017577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,2,balanced,0.7125546932220459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,2,balanced,0.38946131865183514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,4,power_law_1.2,0.12010879516601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,2,balanced,0.39399464925130206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,2,balanced,0.7098186810811361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,4,power_law_1.2,0.1640064001083374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,2,balanced,0.3949439922968547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,2,balanced,0.712112029393514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,4,power_law_1.2,0.206060791015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,2,balanced,0.40026132265726727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,2,balanced,0.719264030456543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,4,power_law_1.2,0.28396799564361574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,2,balanced,0.40476266543070477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,2,balanced,0.7227413654327393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,4,power_law_1.2,0.3012351989746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,2,balanced,0.4099466800689697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,2,balanced,0.7344160079956055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,4,power_law_1.2,0.3168191909790039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,2,balanced,0.4182826677958171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,2,balanced,0.741050640741984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,4,power_law_1.2,0.32537600994110105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,2,balanced,0.43412800629933673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,2,balanced,0.7468907038370768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,4,power_law_1.2,0.3533184051513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,2,balanced,0.4382346471150716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,2,balanced,0.7573653062184652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,4,power_law_1.2,0.3733311891555786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,2,balanced,0.46343998114267987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,2,balanced,0.7962933381398519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,4,power_law_1.2,0.403718376159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,2,balanced,0.4851040045420329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,4,power_law_1.2,0.43250560760498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,2,balanced,0.8439253171284994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,2,balanced,0.525269349416097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,4,power_law_1.2,0.4666111946105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,2,balanced,0.8930239677429199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,2,balanced,0.5854986508687338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,4,power_law_1.2,0.5060287952423096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,4,power_law_1.2,0.5728640079498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,2,balanced,0.9529653390248617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,2,balanced,0.657477339108785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,2,power_law_1.01,0.0815168023109436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,2,balanced,1.0821013450622559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,4,power_law_1.2,0.6630720138549805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,2,balanced,0.7801012992858887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,2,balanced,0.08457066615422566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,2,power_law_1.01,0.1211583971977234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,2,power_law_1.01,0.10303360223770142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,2,balanced,0.09204799930254619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,2,balanced,1.200762669245402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,2,balanced,0.8952426910400391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,4,power_law_1.2,0.6604415893554687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,2,balanced,0.11107732852300008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,2,power_law_1.01,0.1702911972999573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,4,power_law_1.2,0.8182975769042968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,2,balanced,0.16320533553759256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,2,power_law_1.01,0.2666048049926758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,2,balanced,0.24653865893681845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,4,power_law_1.2,0.9758079528808594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,2,balanced,1.57858673731486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,2,power_law_1.01,0.3636543989181519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,2,power_law_1.01,0.06542080044746398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,2,balanced,1.2314026355743408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,2,balanced,0.41944531599680585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,4,power_law_1.2,1.223750400543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,2,power_law_1.01,0.4965824127197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,2,power_law_1.01,0.08369920253753663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,2,balanced,0.42162132263183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,2,power_law_1.01,0.5380735874176026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,4,power_law_1.2,1.492627239227295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,2,power_law_1.01,0.07528319954872131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,2,balanced,0.42720532417297363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,2,power_law_1.01,0.11398400068283081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,2,power_law_1.01,0.526694393157959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,4,power_law_1.2,2.0314687728881835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,2,balanced,1.8032479286193848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,2,balanced,0.4306453466415405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,2,balanced,1.4905279477437336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,2,power_law_1.01,0.16707199811935425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,2,power_law_1.01,0.5599679946899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,4,power_law_1.2,2.954534339904785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,2,balanced,0.4341386556625366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,2,power_law_1.01,0.20215680599212646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,2,power_law_1.01,0.6036992073059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,4,power_law_1.2,4.026591873168945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,2,power_law_1.01,0.2775935888290405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,2,balanced,0.442415992418925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,2,power_law_1.01,0.606009578704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,2,power_law_1.01,0.2952192068099976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,2,balanced,0.4502933422724406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,2,power_law_1.01,0.635423994064331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,4,power_law_1.2,5.065286254882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,2,power_law_1.01,0.30424320697784424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,2,balanced,0.45739734172821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,2,balanced,2.529285271962484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,2,power_law_1.01,0.6502399921417237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,2,balanced,2.1134506861368814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,2,power_law_1.01,0.3121664047241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,4,power_law_1.2,6.720531463623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,2,balanced,0.47090665499369305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,2,power_law_1.01,0.6836095809936523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,2,power_law_1.01,0.32997119426727295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,2,balanced,0.49001598358154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,2,power_law_1.01,0.6981696128845215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,4,power_law_1.2,10.851148986816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,2,power_law_1.01,0.35921919345855713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,2,power_law_1.01,0.7297215938568116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,2,balanced,0.5030986467997233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,2,power_law_1.01,0.3707007884979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,2,power_law_1.01,0.8057344436645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,2,power_law_1.01,0.3801599979400635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,2,balanced,0.5377920071283976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,4,power_law_1.2,20.998828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,2,power_law_1.01,0.8488384246826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,2,power_law_1.01,0.41247358322143557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,2,power_law_1.01,0.9981247901916503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,2,balanced,3.317429224650065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,2,power_law_1.01,0.43627519607543946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,2,balanced,2.709413210550944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,2,power_law_1.01,0.9991680145263672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,2,power_law_1.01,0.44574718475341796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,2,power_law_1.01,1.1897919654846192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,2,power_law_1.01,0.5343808174133301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,2,balanced,0.6277706623077393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,2,power_law_1.01,1.3641728401184081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,2,power_law_1.01,0.5439040184020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,2,power_law_1.01,0.6463295936584472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,2,power_law_1.01,1.8215360641479492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,2,power_law_1.01,0.7144768238067627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,2,power_law_1.01,2.212665557861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,2,power_law_1.01,0.8912832260131835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,2,power_law_1.01,3.080121612548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,2,power_law_1.01,0.09465600252151489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,2,power_law_1.01,1.0206527709960938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,2,balanced,4.053584098815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,2,balanced,0.7409813404083252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,2,power_law_1.01,4.005382537841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,2,balanced,3.520970662434896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,2,power_law_1.01,1.328326416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,2,power_law_1.01,0.11505279541015626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,2,power_law_1.01,5.008371353149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,2,power_law_1.01,0.10115840435028076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,2,power_law_1.01,1.7158079147338867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,2,balanced,0.888970692952474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,2,power_law_1.01,0.13967360258102418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,2,power_law_1.01,2.3468799591064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,2,power_law_1.01,7.71875228881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,2,balanced,0.9827093283335367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,2,power_law_1.01,0.17651840448379516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,2,power_law_1.01,2.987379264831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,2,power_law_1.01,0.23893120288848876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,2,power_law_1.01,14.816064453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,2,power_law_1.01,3.8233921051025392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,2,power_law_1.01,0.31154561042785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,2,balanced,1.3438773155212402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,2,power_law_1.01,0.3365952014923096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,2,power_law_1.01,5.838156890869141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,2,power_law_1.01,0.3480959892272949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,2,balanced,1.5778613090515137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,2,power_law_1.01,0.3602688074111938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,2,power_law_1.01,11.533299255371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,2,power_law_1.01,0.3890944004058838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,2,power_law_1.01,0.4053311824798584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,2,balanced,6.502666473388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,2,balanced,2.422767957051595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,2,balanced,5.290714581807454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,2,power_law_1.01,0.43073282241821287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,2,power_law_1.01,0.4622335910797119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,2,power_law_1.01,0.5119232177734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,2,balanced,2.951823870340983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,2,power_law_1.01,0.5403456211090087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,2,power_law_1.01,0.6308800220489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,2,power_law_1.01,0.7173120021820069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,2,balanced,4.367146809895833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,2,power_law_1.01,0.7742527961730957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,2,power_law_1.2,0.08589439988136291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,2,power_law_1.01,0.9520575523376464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,2,power_law_1.2,0.1183359980583191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,2,power_law_1.01,1.1952320098876954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,2,power_law_1.2,0.09945600032806397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,2,power_law_1.2,0.1579519987106323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,2,power_law_1.01,1.5359935760498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,2,power_law_1.2,0.23429760932922364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,2,power_law_1.01,1.8732160568237304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,2,power_law_1.2,0.32965760231018065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,2,power_law_1.2,0.46482558250427247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,2,power_law_1.01,2.719443130493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,2,balanced,5.793301264444987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,2,power_law_1.2,0.5203519821166992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,2,power_law_1.01,3.267628860473633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,2,power_law_1.2,0.5544767856597901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,2,power_law_1.2,0.5725823879241944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,2,power_law_1.01,4.649856185913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,2,power_law_1.2,0.6006207942962647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,2,power_law_1.2,0.599891185760498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,2,power_law_1.01,6.526751708984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,2,power_law_1.2,0.61910400390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,2,power_law_1.2,0.6740543842315674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,2,power_law_1.01,8.024473571777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,2,power_law_1.2,0.6860095977783203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,2,balanced,13.16165288289388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,2,power_law_1.2,0.7135615825653077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,2,balanced,10.440959930419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,2,power_law_1.2,0.7345280170440673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,2,power_law_1.01,12.538803100585938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,2,power_law_1.2,0.8501824378967285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,2,balanced,7.267397562662761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,2,power_law_1.2,0.9048959732055664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,2,power_law_1.2,1.0576383590698242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,2,power_law_1.01,24.760313415527342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,2,power_law_1.2,1.0387840270996094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,2,power_law_1.2,1.2231295585632325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,2,power_law_1.2,1.5185728073120117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,2,power_law_1.2,1.8486783981323243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,2,power_law_1.2,2.5980735778808595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,2,power_law_1.2,3.2177024841308595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,2,power_law_1.2,4.057638549804688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,2,power_law_1.2,4.933318328857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,2,power_law_1.2,8.026541137695313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,2,power_law_1.2,16.086207580566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,2,balanced,11.61130142211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,2,power_law_1.2,0.06556159853935242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,2,power_law_1.2,0.08387839794158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,2,power_law_1.2,0.07379199862480164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,2,power_law_1.2,0.11398400068283081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,2,power_law_1.2,0.15164799690246583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,2,power_law_1.2,0.19872000217437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,2,power_law_1.2,0.28108160495758056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,2,power_law_1.2,0.2948415994644165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,2,power_law_1.2,0.3099008083343506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,2,power_law_1.2,0.32390398979187013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,2,balanced,23.320810953776043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,2,power_law_1.2,0.33395841121673586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,2,power_law_1.2,0.3483968019485474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,2,power_law_1.2,0.37032959461212156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,2,power_law_1.2,0.3919615983963013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,1,balanced,0.07124799986680348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,2,power_law_1.2,0.42225279808044436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,1,balanced,0.08850133419036865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,2,power_law_1.2,0.45228800773620603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,1,balanced,0.1316266655921936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,2,power_law_1.2,0.46811518669128416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,1,balanced,0.2166879971822103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,2,power_law_1.2,0.09388160109519958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,1,balanced,0.3967946767807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,2,power_law_1.2,0.5379968166351319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,2,power_law_1.2,0.11152000427246093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,1,balanced,0.7135519981384277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,2,power_law_1.2,0.5692800045013428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,2,power_law_1.2,0.10321919918060303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,1,balanced,0.7238346735636393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,2,power_law_1.2,0.6840256214141845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,1,balanced,0.7340106964111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,2,power_law_1.2,0.13731199502944946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,2,power_law_1.2,0.7609600067138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,1,balanced,0.7313600381215414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,2,power_law_1.2,0.17493760585784912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,2,power_law_1.2,0.9275327682495117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,1,balanced,0.7453333536783854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,2,power_law_1.2,1.0826111793518067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,2,power_law_1.2,0.2182528018951416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,1,balanced,0.745749314626058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,1,balanced,0.7531306743621826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,2,power_law_1.2,0.3091520071029663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,2,power_law_1.2,1.432767963409424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,1,balanced,0.7583306630452474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,2,power_law_1.2,0.3341504096984863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,2,power_law_1.2,1.7875839233398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,1,balanced,0.7711733182271322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,2,power_law_1.2,0.3400896072387695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,2,power_law_1.2,2.524799919128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,1,balanced,0.7859466870625814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,2,power_law_1.2,0.36097919940948486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,2,power_law_1.2,3.2583999633789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,1,balanced,0.7995146910349528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,2,power_law_1.2,0.3750463962554932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,1,balanced,0.7975839773813883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,2,power_law_1.2,4.010784149169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,2,power_law_1.2,0.4102464199066162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,1,balanced,0.8720373312632242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,2,power_law_1.2,0.4302847862243652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,2,power_law_1.2,6.423014068603516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,1,balanced,0.9388480186462402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,2,power_law_1.2,0.4804096221923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,2,power_law_1.2,0.5189824104309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,1,balanced,1.0393599669138591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,2,power_law_1.2,12.970124816894531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,2,power_law_1.2,0.550867223739624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,2,power_law_1.2,0.6410624027252197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,1,balanced,1.1965546607971191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,1,balanced,1.3729066848754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,1,balanced,0.05968533456325531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,2,power_law_1.2,0.7455679893493652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,1,balanced,0.07092266778151195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,1,balanced,1.5657226244608562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,1,balanced,0.09572266538937886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,2,power_law_1.2,0.8139967918395996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,1,balanced,0.14845866958300272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,2,power_law_1.2,1.0404864311218263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,1,balanced,0.24766399463017783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,2,power_law_1.2,1.217625617980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,1,balanced,2.131962617238363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,1,balanced,0.4426720142364502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,2,power_law_1.2,1.6161792755126954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,1,balanced,0.4466079870859782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,1,balanced,0.45180265108744305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,2,power_law_1.2,1.8895679473876954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,1,balanced,0.45866668224334717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,2,power_law_1.2,2.6963008880615233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,1,power_law_1.01,0.06716160178184509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,1,balanced,2.5685067176818848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,1,balanced,0.4614559809366862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,2,power_law_1.2,3.483327865600586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,1,power_law_1.01,0.08542079925537109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,1,balanced,0.47144532203674316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,1,balanced,0.4820479949315389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,1,power_law_1.01,0.10160000324249267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,2,power_law_1.2,5.323392105102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,1,balanced,0.4906453291575114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,1,power_law_1.01,0.17786879539489747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,1,power_law_1.01,0.055327999591827395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,2,power_law_1.2,6.775513458251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,1,balanced,0.1272266705830892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,1,balanced,0.5091840028762817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,1,power_law_1.01,0.2713151931762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,1,power_law_1.01,0.06804479956626892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,1,balanced,3.6195360819498696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,1,power_law_1.01,0.07619199752807618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,2,power_law_1.2,8.195993804931641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,1,balanced,0.1367733379205068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,1,power_law_1.01,0.3647104024887085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,1,balanced,0.5260213216145834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,1,power_law_1.01,0.11951999664306641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,1,balanced,0.15503999590873718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,1,power_law_1.01,0.17235200405120848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,1,power_law_1.01,0.5071231842041015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,1,balanced,0.5419093370437622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,1,power_law_1.01,0.22631680965423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,1,balanced,0.2144426703453064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,2,power_law_1.2,13.685658264160157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,1,power_law_1.01,0.5327040195465088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,1,power_law_1.01,0.3217152118682861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,1,balanced,0.5647626717885336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,1,balanced,0.3102933367093404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,1,power_law_1.01,0.3357759952545166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,1,power_law_1.01,0.5511744022369385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,1,balanced,0.5073813199996948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,1,balanced,0.600879987080892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,1,power_law_1.01,0.34980480670928954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,1,balanced,0.5155413150787354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,1,power_law_1.01,0.36370561122894285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,1,power_law_1.01,0.5738368034362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,2,power_law_1.2,26.214175415039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,1,balanced,0.6844533284505209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,1,power_law_1.01,0.3915776014328003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,1,balanced,0.5278506676355997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,1,power_law_1.01,0.619539213180542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,1,power_law_1.01,0.4068352222442627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,1,balanced,4.5797119140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,1,balanced,0.5349066654841105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,1,power_law_1.01,0.4303999900817871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,1,balanced,0.7970506350199381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,1,power_law_1.01,0.6653056144714355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,1,balanced,0.5376319885253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,1,power_law_1.01,0.4537536144256592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,1,balanced,0.5500906705856323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,1,power_law_1.01,0.49643521308898925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,1,power_law_1.01,0.6869823932647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,1,balanced,0.8437493642171224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,1,power_law_1.01,0.5242623805999755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,1,balanced,0.5687253475189209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,1,power_law_1.01,0.7142528057098388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,1,power_law_1.01,0.538912010192871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,1,balanced,0.5847626527150472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,1,power_law_1.01,0.6237823963165283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,1,power_law_1.01,0.7376192092895508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,1,balanced,1.0469280083974202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,1,power_law_1.01,0.6865536212921143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,1,balanced,0.6071999867757162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,1,power_law_1.01,0.7767680168151856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,1,power_law_1.01,0.8376704216003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,1,balanced,0.6538346608479818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,1,power_law_1.01,0.8866815567016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,1,power_law_1.01,0.7844480037689209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,1,balanced,0.6887306372324625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,1,balanced,1.2624159653981526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,1,power_law_1.01,1.114572811126709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,1,balanced,5.985776265462239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,1,power_law_1.01,0.905247974395752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,1,power_law_1.01,1.3395456314086913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,1,balanced,0.7363466421763102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,1,power_law_1.01,0.9766464233398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,1,power_law_1.01,1.8178495407104491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,1,power_law_1.01,2.289651107788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,1,power_law_1.01,1.1476415634155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,1,balanced,1.7933173179626465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,1,power_law_1.01,3.265990447998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,1,power_law_1.01,1.1896384239196778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,1,power_law_1.01,4.224825668334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,1,balanced,0.8920479615529379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,1,power_law_1.01,1.4341631889343263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,1,power_law_1.01,5.1802623748779295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,1,power_law_1.01,1.6873088836669923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,1,balanced,2.2578293482462564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,1,power_law_1.01,7.91167984008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,1,power_law_1.01,2.2071807861328123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,1,power_law_1.01,2.71713924407959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,1,power_law_1.01,15.459884643554688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,1,balanced,1.1176053682963054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,1,power_law_1.01,3.7805824279785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,1,balanced,1.3971734046936035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,1,power_law_1.01,4.833055877685547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,1,balanced,3.279535929361979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,1,balanced,8.964239756266275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,1,balanced,1.549498716990153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,1,power_law_1.01,5.9108222961425785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,1,power_law_1.01,0.11335680484771729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,1,power_law_1.01,0.12513279914855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,1,balanced,2.2341866493225098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,1,power_law_1.01,9.206451416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,1,power_law_1.01,0.13992960453033448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,1,power_law_1.01,0.18807040452957152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,1,power_law_1.01,0.2375744104385376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,1,balanced,2.667311986287435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,1,power_law_1.01,17.49516143798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,1,power_law_1.01,0.29241600036621096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,1,balanced,4.074463844299316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,1,power_law_1.01,0.38471040725708006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,1,power_law_1.01,0.4095168113708496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,1,balanced,4.217119852701823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,1,power_law_1.01,0.42933120727539065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,1,power_law_1.01,0.44954237937927244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,1,power_law_1.01,0.47823362350463866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,1,power_law_1.01,0.5103744029998779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,1,balanced,5.178874651590983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,1,power_law_1.01,0.5393472194671631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,1,power_law_1.01,0.6088768005371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,1,balanced,5.377285639444987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,1,power_law_1.01,0.6747712135314942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,1,power_law_1.01,0.735097599029541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,1,power_law_1.01,0.8489536285400391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,1,balanced,7.628032048543294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,1,power_law_1.01,1.0204095840454102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.01,1.1269887924194335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,1,balanced,17.410879770914715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.01,1.4524736404418945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,1,balanced,10.061445236206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.01,1.7702272415161133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.01,2.34192008972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,1,power_law_1.2,0.06842880249023438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,1,balanced,7.805477142333984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.01,2.925823974609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,1,power_law_1.2,0.08329600095748901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.01,4.142476654052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,1,power_law_1.2,0.10246399641036988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.01,5.366144180297852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,1,power_law_1.2,0.1647487998008728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,1,power_law_1.2,0.24979839324951172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.01,7.787039947509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,1,power_law_1.2,0.31456000804901124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,1,balanced,12.468266805013021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.01,10.199110412597657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,1,power_law_1.2,0.4980288028717041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,1,power_law_1.2,0.5248511791229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,1,power_law_1.01,12.628972625732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,1,power_law_1.2,0.5452288150787353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,1,power_law_1.2,0.5952383995056152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,1,power_law_1.01,19.935487365722658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,1,power_law_1.2,0.628768014907837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,1,power_law_1.2,0.6585023880004883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,1,power_law_1.2,0.6904895782470704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,1,power_law_1.01,39.2293701171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,1,power_law_1.2,0.7160511970520019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,1,power_law_1.2,0.7707712173461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,1,power_law_1.2,0.8420479774475098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,1,power_law_1.2,0.8176575660705566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,1,balanced,19.875221252441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,1,power_law_1.2,0.940345573425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,1,power_law_1.2,1.028486442565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,1,power_law_1.2,0.055878400802612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,1,power_law_1.2,1.2018239974975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,1,power_law_1.2,0.06739839911460876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,1,power_law_1.2,1.2510080337524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,1,power_law_1.2,0.07591040134429931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,1,balanced,15.35977554321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,1,power_law_1.2,0.11498240232467652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,1,power_law_1.2,1.5075136184692384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,1,power_law_1.2,0.16092159748077392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,1,power_law_1.2,1.7512256622314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,1,power_law_1.2,0.20794239044189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,1,power_law_1.2,2.2690752029418944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,1,power_law_1.2,0.3152384042739868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,1,power_law_1.2,2.7784576416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,1,power_law_1.2,0.3252351999282837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,1,power_law_1.2,3.841843032836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,1,power_law_1.2,0.3504256010055542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,1,power_law_1.2,0.36506240367889403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,1,power_law_1.2,5.092441558837891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,1,power_law_1.2,0.38667519092559816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,1,power_law_1.2,6.365017700195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,1,power_law_1.2,0.41850881576538085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,1,power_law_1.2,0.4356224060058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,1,power_law_1.2,9.869152069091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,1,power_law_1.2,0.4547840118408203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,1,power_law_1.2,0.5064832210540772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,1,power_law_1.2,17.555014038085936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,1,power_law_1.2,0.5465919971466064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,1,power_law_1.2,0.5473536014556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,1,power_law_1.2,0.6468992233276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,1,power_law_1.2,0.7113920211791992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,1,power_law_1.2,0.8582528114318848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,1,power_law_1.2,0.11303039789199829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,1,balanced,39.77020772298177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,1,power_law_1.2,0.9432064056396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,1,power_law_1.2,1.1698368072509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,1,power_law_1.2,0.12595200538635254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,1,power_law_1.2,1.3607359886169434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,1,power_law_1.2,0.14024959802627562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,8,balanced,0.028351999819278717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,1,power_law_1.2,0.1779263973236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,1,power_law_1.2,1.8347455978393554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,8,balanced,0.02861333390076955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,1,power_law_1.2,0.22473599910736083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,1,power_law_1.2,2.324179267883301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,8,balanced,0.03234666585922241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,1,power_law_1.2,0.27173120975494386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,8,balanced,0.04435733457406362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,1,power_law_1.2,3.309203338623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,1,power_law_1.2,0.38029439449310304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,8,balanced,0.06099733213583628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,1,power_law_1.2,4.2358142852783205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,1,power_law_1.2,0.39962880611419677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,8,balanced,0.05871466795603434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,1,power_law_1.2,0.43116159439086915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,8,balanced,0.06084266801675161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,1,power_law_1.2,5.234163284301758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,8,balanced,0.060645331939061485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,1,power_law_1.2,0.4400576114654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,8,balanced,0.05806399881839752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,1,power_law_1.2,0.47981438636779783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,1,power_law_1.2,7.900358581542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,8,balanced,0.061306665341059365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,1,power_law_1.2,0.5144192218780518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,8,balanced,0.06020799775918325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,1,power_law_1.2,0.5481535911560058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,1,power_law_1.2,15.378477478027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,8,balanced,0.061333333452542625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,1,power_law_1.2,0.6248511791229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,8,balanced,0.0621066689491272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,1,power_law_1.2,0.6962624073028565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,8,balanced,0.06242666641871134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,1,power_law_1.2,0.7522175788879395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,8,balanced,0.06770133475462596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,1,power_law_1.2,0.863584041595459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,8,balanced,0.07057066758473714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,8,balanced,0.07153066496054332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,8,balanced,0.07748800019423167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,1,power_law_1.2,1.0302656173706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,8,balanced,0.031770666440327965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,8,balanced,0.08880533774693807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,8,balanced,0.03223466624816259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,8,balanced,0.09447466333707173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.2,1.1358271598815919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,8,balanced,0.03283733377854029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,8,balanced,0.035088000198205314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.2,1.4615936279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,8,balanced,0.10230400164922078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,8,balanced,0.05250666538874308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.2,1.7744192123413085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,8,balanced,0.054325332244237266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,8,balanced,0.12315733234087627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.2,2.3805376052856446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,8,balanced,0.0539626677831014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.2,2.9722112655639648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,8,balanced,0.05398400127887726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,8,balanced,0.13551466663678488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,8,balanced,0.05422399938106537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.2,4.180684661865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,8,balanced,0.05472533404827118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.2,5.401900863647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,8,balanced,0.05509866774082184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,8,balanced,0.05602666735649109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,8,balanced,0.18281600872675577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.2,7.823334503173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,8,balanced,0.057162667314211525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,8,balanced,0.05824000140031179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.2,10.220825958251954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,8,balanced,0.06267199913660686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,8,balanced,0.20470933119455972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,8,balanced,0.06145066519578298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,1,power_law_1.2,12.648492431640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,8,balanced,0.06544533371925354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,8,balanced,0.07029333213965099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,1,power_law_1.2,19.900262451171876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,8,balanced,0.07548800110816956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,8,balanced,0.08247999846935272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,8,balanced,0.29999999205271405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,1,power_law_1.2,39.37269897460938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,8,balanced,0.09078933795293172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,8,balanced,0.12043199936548869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,8,balanced,0.1350826621055603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,8,balanced,0.3736000061035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,8,balanced,0.02588266630967458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,8,balanced,0.027061333258946735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,8,power_law_1.01,0.04420480132102966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,8,balanced,0.18438933293024698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,8,balanced,0.028399998943010967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,8,power_law_1.01,0.035104000568389894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,8,balanced,0.031397332747777305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,8,balanced,0.04667200148105621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,8,power_law_1.01,0.03380480110645294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,8,balanced,0.047797332207361855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,8,power_law_1.01,0.04301440119743347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,8,balanced,0.047872001926104225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,8,power_law_1.01,0.046239998936653134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,8,balanced,0.04846400022506714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,8,power_law_1.01,0.053011202812194826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,8,balanced,0.22402133544286093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,8,power_law_1.01,0.0566976010799408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,8,balanced,0.0487413356701533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,8,power_law_1.01,0.05617920160293579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,8,balanced,0.04953599969546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,8,balanced,0.4718240102132161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,8,power_law_1.01,0.05633919835090637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,8,balanced,0.04978133241335551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,8,power_law_1.01,0.0581055998802185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,8,balanced,0.05161599814891815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,8,power_law_1.01,0.06238080263137817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,8,balanced,0.05271466573079427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,8,power_law_1.01,0.06698880195617676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,8,balanced,0.053258667389551796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,8,balanced,0.3277920087178548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,8,power_law_1.01,0.07131519913673401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,8,power_law_1.01,0.07541760206222534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,8,power_law_1.01,0.07862399816513062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,8,power_law_1.01,0.08375679850578308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,8,balanced,0.05983466903368632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,8,power_law_1.01,0.08712319731712341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,8,power_law_1.01,0.03824639916419983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,8,power_law_1.01,0.10399999618530273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,8,balanced,0.059706668059031166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,8,power_law_1.01,0.11125760078430176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,8,power_law_1.01,0.03281280100345611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,8,power_law_1.01,0.12691199779510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,8,power_law_1.01,0.03296000063419342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,8,power_law_1.01,0.1493824005126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,8,balanced,0.41657066345214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,8,power_law_1.01,0.21109120845794677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,8,power_law_1.01,0.03777279853820801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,8,power_law_1.01,0.21568000316619873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,8,power_law_1.01,0.041440001130104064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,8,power_law_1.01,0.25651841163635253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,8,power_law_1.01,0.05108479857444763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,8,power_law_1.01,0.37574400901794436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,8,power_law_1.01,0.052198398113250735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,8,balanced,0.06474133332570393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,8,balanced,0.7137973308563232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,8,power_law_1.01,0.5276415824890137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,8,power_law_1.01,0.05304960012435913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,8,power_law_1.01,0.6616767883300781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,8,balanced,0.07299200197060902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,8,power_law_1.01,0.053324800729751584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,8,power_law_1.01,0.7862656116485596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,8,power_law_1.01,0.05480319857597351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,8,balanced,0.07502399881680806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,8,power_law_1.01,1.2599488258361817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,8,power_law_1.01,0.055622398853302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,8,power_law_1.01,0.03078399896621704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,8,power_law_1.01,0.056358402967453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,8,power_law_1.01,2.5802560806274415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,8,power_law_1.01,0.029382398724555968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,8,power_law_1.01,0.060140800476074216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,8,balanced,0.5209013223648071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,8,power_law_1.01,0.06077439785003662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,8,power_law_1.01,0.029849600791931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,8,balanced,0.09292800227801006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,8,power_law_1.01,0.0674239993095398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,8,power_law_1.01,0.035231998562812804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,8,power_law_1.01,0.06986879706382751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,8,balanced,0.10300266742706299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,8,power_law_1.01,0.03715839982032776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,8,power_law_1.01,0.07112320065498352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,8,power_law_1.01,0.04584319889545441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,8,power_law_1.01,0.0819711983203888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,8,balanced,0.1431893308957418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,8,power_law_1.01,0.09488639831542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,8,power_law_1.01,0.04767360091209412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,8,power_law_1.01,0.10762239694595337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,8,power_law_1.01,0.048467200994491574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,8,power_law_1.01,0.1235967993736267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,8,balanced,0.16421866416931152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,8,power_law_1.01,0.04870400130748749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,8,power_law_1.01,0.16401920318603516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,8,power_law_1.01,0.05030400156974792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,8,power_law_1.01,0.19791359901428224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,8,power_law_1.2,0.04305280148983002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,8,power_law_1.01,0.05459840297698974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,8,power_law_1.01,0.2534976005554199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,8,power_law_1.2,0.03111039996147156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,8,power_law_1.01,0.058406400680541995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,8,power_law_1.01,0.3316159963607788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,8,power_law_1.2,0.03368319869041443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,8,power_law_1.01,0.05976319909095764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,8,balanced,0.7911626497904459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,8,power_law_1.01,0.4660160064697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,8,power_law_1.2,0.04100480079650879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,8,power_law_1.01,0.0639680027961731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,8,power_law_1.01,0.6352511882781983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,8,balanced,0.23730132977167764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,8,power_law_1.2,0.04110719859600067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,8,power_law_1.2,0.05491840243339539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,8,power_law_1.01,0.8515775680541993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,8,power_law_1.2,0.05688959956169128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,8,power_law_1.01,0.06991999745368957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,8,power_law_1.2,0.059487998485565186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,8,power_law_1.01,1.1984831809997558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,8,power_law_1.01,0.0759872019290924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,8,power_law_1.2,0.0590719997882843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,8,balanced,0.31617067257563275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,8,power_law_1.2,0.06175360083580017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,8,power_law_1.01,2.45743350982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,8,power_law_1.2,0.06719359755516052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,8,balanced,1.3670506477355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,8,power_law_1.01,0.0784063994884491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,8,power_law_1.2,0.06681600213050842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,8,power_law_1.01,0.08906239867210389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,8,power_law_1.2,0.07278079986572265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,8,power_law_1.01,0.10338560342788697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,8,power_law_1.2,0.07370880246162415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,8,balanced,0.4645920197168986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,8,power_law_1.2,0.07651839852333069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,8,power_law_1.01,0.13335039615631103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,8,power_law_1.2,0.08236160278320312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,8,power_law_1.01,0.1504320025444031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,8,power_law_1.2,0.09683200120925903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,8,power_law_1.01,0.2023616075515747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,8,power_law_1.2,0.10695040225982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,8,power_law_1.01,0.252128005027771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,8,power_law_1.2,0.11819519996643066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,8,power_law_1.2,0.12654080390930175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,8,power_law_1.01,0.4274240016937256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,8,balanced,0.6129759947458903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,8,power_law_1.2,0.1659775972366333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,8,power_law_1.2,0.21528959274291992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,8,power_law_1.01,0.5162112236022949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,8,power_law_1.2,0.2617216110229492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,8,power_law_1.01,0.8155391693115235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,8,power_law_1.2,0.3022016048431396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,8,power_law_1.01,1.0762816429138184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,8,power_law_1.2,0.42710399627685547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,8,power_law_1.01,1.210707187652588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,8,power_law_1.2,0.5679168224334716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,8,balanced,1.5212640762329102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,8,power_law_1.2,0.0385919988155365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,8,power_law_1.2,0.8902463912963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,8,power_law_1.01,2.4794368743896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,8,power_law_1.2,0.032128000259399415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,8,power_law_1.2,0.9526592254638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,8,balanced,0.7611947059631348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,8,power_law_1.01,4.344998550415039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,8,power_law_1.2,0.03170560002326965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,8,power_law_1.2,1.5613632202148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,8,power_law_1.2,0.036032000184059144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,8,power_law_1.2,4.363391876220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,8,power_law_1.2,0.03871999979019165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,8,power_law_1.2,0.04839679896831513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,8,power_law_1.2,0.05189759731292724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,8,power_law_1.2,0.053401601314544675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,8,power_law_1.2,0.053504002094268796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,8,power_law_1.2,0.05381119847297668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,8,power_law_1.2,0.055692797899246214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,8,balanced,1.1957226594289143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,8,power_law_1.2,0.055206400156021115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,8,power_law_1.2,0.05994880199432373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,8,power_law_1.2,0.06343039870262146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,8,power_law_1.2,0.06805760264396668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,8,power_law_1.2,0.07340800166130065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,8,power_law_1.2,0.07490559816360473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,8,power_law_1.2,0.08439679741859436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,8,power_law_1.2,0.09978240132331848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,8,power_law_1.2,0.10623359680175781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,8,power_law_1.2,0.1441151976585388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,8,power_law_1.2,0.17348480224609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,8,power_law_1.2,0.21333119869232178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,8,power_law_1.2,0.2796544075012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,8,power_law_1.2,0.38024320602416994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,8,power_law_1.2,0.6381247997283935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,8,power_law_1.2,0.8473919868469239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,8,power_law_1.2,0.9849791526794434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,8,power_law_1.2,1.509011173248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,8,power_law_1.2,4.310355377197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,8,power_law_1.2,0.03165439963340759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,8,balanced,2.3436266581217446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,8,power_law_1.2,0.029100799560546876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,8,power_law_1.2,0.029574400186538695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,8,power_law_1.2,0.03349120020866394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,8,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,8,power_law_1.2,0.046828800439834596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,8,power_law_1.2,0.04745599925518036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,8,power_law_1.2,0.04958080053329468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,8,power_law_1.2,0.04927999973297119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,8,power_law_1.2,0.050316798686981204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,8,power_law_1.2,0.05697280168533325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,8,power_law_1.2,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,8,power_law_1.2,0.06162559986114502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,8,power_law_1.2,0.06865280270576476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,8,power_law_1.2,0.07273600101470948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,8,power_law_1.2,0.07802240252494812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,8,power_law_1.2,0.07973759770393371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,4,balanced,0.03186666717131933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,8,power_law_1.2,0.09923840165138245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,4,balanced,0.024277334411938984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,4,balanced,0.031157332162062328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,8,power_law_1.2,0.1159551978111267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,4,balanced,0.025226667523384094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,4,balanced,0.03230933348337809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,4,balanced,0.03201599915822347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,4,balanced,0.03665599972009659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,8,power_law_1.2,0.13761919736862183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,4,balanced,0.04121600091457367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,4,balanced,0.054789334535598755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,8,power_law_1.2,0.15021439790725707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,4,balanced,0.06363733112812042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,4,balanced,0.05574400226275126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,8,power_law_1.2,0.22247679233551027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,4,balanced,0.06156266729036967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,4,balanced,0.05489066739877065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,4,balanced,0.06307733555634816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,4,balanced,0.05611733098824819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,8,power_law_1.2,0.3353791952133179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,4,balanced,0.06364800035953522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,4,balanced,0.05663466453552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,4,balanced,0.0613013356924057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,4,balanced,0.056330665946006775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,8,power_law_1.2,0.4509312152862549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,4,balanced,0.06411199768384297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,4,balanced,0.0566293348868688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,8,power_law_1.2,0.8159104347229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,4,balanced,0.06600533425807953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,4,balanced,0.058933332562446594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,4,balanced,0.0674239993095398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,4,balanced,0.05919999877611796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,8,power_law_1.2,1.1563072204589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,4,balanced,0.06820266445477803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,4,balanced,0.06099733213583628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,8,power_law_1.2,1.4740415573120118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,4,balanced,0.07028266787528992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,4,balanced,0.06607466439406078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,4,balanced,0.07523733377456665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,4,balanced,0.06597333153088887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,8,power_law_1.2,1.614739227294922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,4,balanced,0.07799466451009114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,4,balanced,0.072543998559316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,8,power_law_1.2,3.089516830444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,4,balanced,0.07983999947706859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,4,balanced,0.07936533292134602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,4,balanced,0.08749333024024963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,8,power_law_1.2,6.306137466430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,4,balanced,0.08489066362380981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,4,balanced,0.09596799810727437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,4,power_law_1.01,0.028275200724601747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,4,balanced,0.09702933828035991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,4,balanced,0.10399466753005981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,4,power_law_1.01,0.03493120074272156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,4,power_law_1.01,0.026694399118423463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,4,power_law_1.01,0.031033599376678468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,4,balanced,0.10930666327476501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,4,power_law_1.01,0.03343999981880188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,4,balanced,0.11209066708882649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,4,power_law_1.01,0.03281919956207276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,4,power_law_1.01,0.03716480135917664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,4,power_law_1.01,0.03821440041065216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,4,balanced,0.1449066698551178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,4,power_law_1.01,0.045535999536514285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,4,balanced,0.1477013329664866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,4,balanced,0.030618667602539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,4,power_law_1.01,0.04161919951438904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,4,power_law_1.01,0.053523200750350955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,4,balanced,0.031530665854612984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,4,power_law_1.01,0.05942400097846985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,4,power_law_1.01,0.05092480182647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,4,balanced,0.03239466746648153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,4,balanced,0.1672053337097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,4,balanced,0.16686934232711792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,4,balanced,0.03667200108369192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,4,power_law_1.01,0.06116480231285095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,4,power_law_1.01,0.053529602289199826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,4,balanced,0.05116266508897146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,4,balanced,0.0524586687485377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,4,power_law_1.01,0.06083199977874756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,4,power_law_1.01,0.054688000679016115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,4,balanced,0.053871999184290566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,4,power_law_1.01,0.06120319962501526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,4,power_law_1.01,0.05553920269012451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,4,balanced,0.054234668612480164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,4,balanced,0.23676800727844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,4,balanced,0.2281386653582255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,4,power_law_1.01,0.06802560091018676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,4,balanced,0.054666668176651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,4,power_law_1.01,0.05495679974555969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,4,balanced,0.05489066739877065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,4,power_law_1.01,0.07089920043945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,4,power_law_1.01,0.05863040089607239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,4,balanced,0.055861334005991616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,4,power_law_1.01,0.07164160013198853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,4,power_law_1.01,0.060102397203445436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,4,balanced,0.0576800008614858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,4,balanced,0.05985599756240845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,4,power_law_1.01,0.07598080039024353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,4,power_law_1.01,0.06236799955368042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,4,balanced,0.060789331793785095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,4,power_law_1.01,0.06312320232391358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,4,power_law_1.01,0.0815999984741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,4,balanced,0.29898667335510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,4,balanced,0.2715359926223755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,4,power_law_1.01,0.07017599940299987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,4,power_law_1.01,0.08353279829025269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,4,power_law_1.01,0.07281280159950257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,4,power_law_1.01,0.08903040289878845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,4,power_law_1.01,0.07694079875946044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,4,power_law_1.01,0.10826879739761353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,4,balanced,0.07074666519959767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,4,power_law_1.01,0.09143679738044738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,4,power_law_1.01,0.1241536021232605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,4,balanced,0.07089066505432129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,4,power_law_1.01,0.10113919973373413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,4,power_law_1.01,0.13646719455718995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,4,balanced,0.45313600699106854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,4,power_law_1.01,0.11273599863052368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,4,power_law_1.01,0.15143040418624878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,4,power_law_1.01,0.1368127942085266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,4,balanced,0.40628798802693683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,4,power_law_1.01,0.2007551908493042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,4,power_law_1.01,0.1787775993347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,4,power_law_1.01,0.21765120029449464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,4,balanced,0.07855466504891713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,4,power_law_1.01,0.30512640476226804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,4,power_law_1.01,0.21137919425964355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,4,power_law_1.01,0.3694591999053955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,4,balanced,0.09118400017420451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,4,power_law_1.01,0.2962559938430786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,4,balanced,0.09575999776522319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,4,power_law_1.01,0.5359104156494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,4,power_law_1.01,0.38818559646606443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,4,power_law_1.01,0.6311039924621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,4,power_law_1.01,0.6524032115936279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,4,balanced,0.5875413417816162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,4,power_law_1.01,0.7331776142120361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,4,power_law_1.01,0.8353919982910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,4,balanced,0.5132213433583578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,4,power_law_1.01,0.9167743682861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,4,balanced,0.12292266885439555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,4,power_law_1.01,1.2467071533203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,4,power_law_1.01,1.3651840209960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,4,balanced,0.13846400380134583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,4,power_law_1.01,2.4440832138061523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,4,power_law_1.01,3.0282495498657225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,4,balanced,0.20490666230519614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,4,power_law_1.2,0.028230398893356323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,4,power_law_1.2,0.02768639922142029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,4,balanced,0.25857067108154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,4,power_law_1.2,0.031718400120735166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,4,balanced,0.7272053559621176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,4,power_law_1.2,0.03526400029659271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,4,power_law_1.01,0.03136000037193298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,4,power_law_1.2,0.04434559941291809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,4,balanced,0.3743199904759725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,4,power_law_1.01,0.03292160034179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,4,balanced,0.6464426517486572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,4,power_law_1.2,0.055846399068832396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,4,power_law_1.01,0.03324800133705139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,4,power_law_1.2,0.05909119844436646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,4,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,4,power_law_1.2,0.06231039762496948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,4,balanced,0.48468267917633057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,4,power_law_1.01,0.04089600145816803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,4,power_law_1.2,0.06155520081520081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,4,power_law_1.2,0.06453120112419128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,4,power_law_1.01,0.05245440006256104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,4,power_law_1.2,0.06853119730949402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,4,power_law_1.01,0.05261440277099609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,4,power_law_1.2,0.07289599776268005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,4,power_law_1.01,0.05444480180740356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,4,power_law_1.01,0.055052798986434934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,4,power_law_1.2,0.07415680289268493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,4,balanced,0.7115200360616049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,4,power_law_1.01,0.05661439895629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,4,power_law_1.2,0.0754047989845276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,4,power_law_1.01,0.06050559878349304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,4,power_law_1.2,0.08287360072135926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,4,balanced,1.1336906750996907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,4,power_law_1.01,0.06547840237617493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,4,power_law_1.2,0.08382080197334289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,4,power_law_1.01,0.0673919975757599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,4,power_law_1.2,0.09472640156745911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,4,power_law_1.01,0.07270399928092956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,4,power_law_1.2,0.11159679889678956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,4,balanced,0.9669919808705648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,4,power_law_1.2,0.12410240173339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,4,balanced,0.9390079975128174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,4,power_law_1.2,0.14739840030670165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,4,power_law_1.01,0.07996799945831298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,4,power_law_1.2,0.15555839538574218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,4,power_law_1.01,0.08446080088615418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,4,power_law_1.2,0.20901119709014893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,4,power_law_1.2,0.2397439956665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,4,power_law_1.01,0.09182720184326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,4,power_law_1.2,0.3255743980407715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,4,power_law_1.01,0.10661760568618775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,4,power_law_1.2,0.4344639778137207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,4,power_law_1.01,0.12842880487442015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,4,power_law_1.2,0.616761589050293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,4,power_law_1.2,0.8727616310119629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,4,balanced,1.1597493489583333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,4,power_law_1.01,0.15124479532241822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,4,power_law_1.2,1.07576322555542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,4,power_law_1.01,0.18869119882583618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,4,power_law_1.01,0.2641727924346924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,4,power_law_1.2,1.6756607055664063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,4,power_law_1.01,0.35396480560302734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,4,power_law_1.01,0.5047103881835937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,4,power_law_1.2,3.039654350280762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,4,power_law_1.01,0.6648767948150635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,4,power_law_1.01,0.9084671974182129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,4,power_law_1.01,1.3874239921569824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,4,power_law_1.01,1.621683120727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,4,power_law_1.01,2.4156095504760744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,4,balanced,2.182736078898112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,4,power_law_1.2,0.03470720052719116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,4,power_law_1.01,4.756524658203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,4,balanced,1.8233920733133953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,4,power_law_1.2,0.031065601110458373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,4,power_law_1.2,0.033555200695991515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,4,balanced,1.8710826237996419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,4,power_law_1.2,0.03772160112857818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,4,power_law_1.2,0.03877759873867035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,4,power_law_1.2,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,4,power_law_1.2,0.05375999808311462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,4,power_law_1.2,0.055379199981689456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,4,power_law_1.2,0.05634559988975525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,4,power_law_1.2,0.05546240210533142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,4,power_law_1.2,0.059001600742340087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,4,power_law_1.2,0.06098560094833374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,4,power_law_1.2,0.06242560148239136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,4,power_law_1.2,0.0662335991859436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,4,power_law_1.2,0.07146880030632019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,4,power_law_1.2,0.0762880027294159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,4,power_law_1.2,0.08105599880218506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,4,power_law_1.2,0.09233279824256897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,4,power_law_1.2,0.10465279817581177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,4,power_law_1.2,0.12999680042266845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,4,power_law_1.2,0.1527999997138977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,4,power_law_1.2,0.18880640268325805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,4,balanced,3.586437225341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,4,power_law_1.2,0.22369918823242188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,4,power_law_1.2,0.34835200309753417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,4,power_law_1.2,0.45873279571533204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,4,power_law_1.2,0.6736959934234619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,4,power_law_1.2,0.8279487609863281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,4,power_law_1.2,1.3140735626220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,4,power_law_1.2,0.03208959996700287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,4,power_law_1.2,0.032569599151611325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,4,power_law_1.2,2.016979217529297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,4,power_law_1.2,0.03313280045986176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,4,power_law_1.2,0.03852159976959228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,4,power_law_1.2,4.1567230224609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,4,power_law_1.2,0.0394239991903305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,2,balanced,0.0249439999461174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,4,power_law_1.2,0.05182719826698303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,2,balanced,0.026191999514897663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,4,power_law_1.2,0.05244160294532776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,2,balanced,0.029365333418051403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,4,power_law_1.2,0.054713600873947145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,2,balanced,0.04470933477083842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,4,power_law_1.2,0.05516160130500793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,2,balanced,0.06272533535957336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,4,power_law_1.2,0.05759360194206238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,2,balanced,0.06940266489982605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,4,power_law_1.2,0.06053760051727295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,2,balanced,0.07018666466077168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,4,power_law_1.2,0.06699519753456115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,2,balanced,0.0688266654809316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,4,power_law_1.2,0.06910079717636108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,2,balanced,0.06925866504510243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,2,balanced,0.06985066831111908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,4,power_law_1.2,0.07422720193862915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,2,balanced,0.07166933516661327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,2,balanced,0.07212799787521362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,4,power_law_1.2,0.08085119724273682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,2,balanced,0.07326933244864146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,4,power_law_1.2,0.08700159788131714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,2,balanced,0.07589866717656453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,2,balanced,0.08224533498287201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,4,power_law_1.2,0.0946943998336792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,2,balanced,0.08463467160860698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,4,power_law_1.2,0.1145408034324646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,2,balanced,0.09011200070381165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,4,power_law_1.2,0.1288383960723877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,2,balanced,0.10102933645248413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,2,balanced,0.11565867066383362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,4,power_law_1.2,0.15745919942855835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,4,power_law_1.2,0.19882880449295043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,2,balanced,0.137445330619812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,4,power_law_1.2,0.3062016010284424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,4,power_law_1.2,0.3853312015533447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,2,balanced,0.14894400040308634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,4,power_law_1.2,0.5222208023071289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,4,power_law_1.2,0.6809023857116699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,2,balanced,0.19712533553441366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,4,power_law_1.2,1.0929216384887694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,2,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,4,power_law_1.2,1.7031232833862304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,2,balanced,0.03234666585922241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,2,balanced,0.2371573249499003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,2,balanced,0.03565333286921183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,4,power_law_1.2,2.0656831741333006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,2,balanced,0.041936000188191734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,4,power_law_1.2,2.747443199157715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,2,balanced,0.06044800082842509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,2,balanced,0.3121440013249715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,2,balanced,0.06177600224812826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,2,balanced,0.06162666777769724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,4,power_law_1.2,6.383391952514648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,2,balanced,0.061280002196629844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,2,balanced,0.06306666632493337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,2,balanced,0.06309333443641663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,2,balanced,0.4024266799290975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,2,balanced,0.0634933312733968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,2,balanced,0.0653706689675649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,2,balanced,0.06845866640408833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,2,balanced,0.07022933165232341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,2,balanced,0.07720533510049184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,2,balanced,0.6325440009435018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,2,balanced,0.04030933231115341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,2,balanced,0.07856533428033192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,2,balanced,0.042319998145103455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,2,power_law_1.01,0.026700800657272337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,2,balanced,0.08839999636014302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,2,balanced,0.043247997760772705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,2,power_law_1.01,0.02620159983634949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,2,balanced,0.049269333481788635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,2,balanced,0.10028800368309021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,2,balanced,0.06409599880377452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,2,power_law_1.01,0.029516801238059998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,2,power_law_1.01,0.035980799794197084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,2,balanced,0.10656000177065532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,2,balanced,0.06592000027497609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,2,power_law_1.01,0.03958399891853333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,2,balanced,0.06632000207901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,2,power_law_1.01,0.031033599376678468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,2,power_law_1.01,0.043942400813102724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,2,balanced,0.12706666191418967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,2,balanced,0.7931146621704102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,2,balanced,0.06717866659164429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,2,power_law_1.01,0.03447040021419525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,2,power_law_1.01,0.06111999750137329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,2,balanced,0.06833600004514058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,2,balanced,0.14565333724021912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,2,power_law_1.01,0.03991680145263672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,2,power_law_1.01,0.06250879764556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,2,balanced,0.06974400083223979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,2,power_law_1.01,0.043315199017524716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,2,power_law_1.01,0.06518399715423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,2,balanced,0.07167999943097432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,2,power_law_1.01,0.05664640069007874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,2,balanced,0.203274667263031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,2,power_law_1.01,0.06825600266456604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,2,balanced,0.07587733368078868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,2,power_law_1.01,0.057580798864364624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,2,power_law_1.01,0.07004799842834472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,2,balanced,0.07831466694672902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,2,power_law_1.01,0.05950719714164734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,2,balanced,0.2461706598599752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,2,power_law_1.01,0.07438079714775085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,2,power_law_1.01,0.06120960116386413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,2,balanced,0.07993599772453308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,2,power_law_1.01,0.0769919991493225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,2,power_law_1.01,0.06199679970741272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,2,power_law_1.01,0.08235520124435425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,2,balanced,0.9833493232727051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,2,power_law_1.01,0.06653439998626709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,2,balanced,0.3606559832890828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,2,power_law_1.01,0.0813759982585907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,2,power_law_1.01,0.07086719870567322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,2,power_law_1.01,0.08856959939002991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,2,balanced,0.0937493344148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,2,power_law_1.01,0.07445759773254394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,2,power_law_1.01,0.0921343982219696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,2,power_law_1.01,0.07694079875946044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,2,power_law_1.01,0.1082111954689026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,2,balanced,0.09461333354314168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,2,balanced,0.4676640033721924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,2,power_law_1.01,0.08422399759292602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,2,power_law_1.01,0.12012799978256225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,2,power_law_1.01,0.08856959939002991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,2,power_law_1.01,0.13004159927368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,2,power_law_1.01,0.09765120148658753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,2,power_law_1.01,0.1606719970703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,2,power_law_1.01,0.11584639549255371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,2,power_law_1.01,0.16885759830474853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,2,power_law_1.01,0.12683520317077637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,2,power_law_1.01,0.23097600936889648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,2,balanced,0.1090133289496104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,2,power_law_1.01,0.03777920007705689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,2,balanced,0.7196426391601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,2,power_law_1.01,0.1510591983795166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,2,power_law_1.01,0.2791296005249023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,2,balanced,0.130703995625178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,2,power_law_1.01,0.04188799858093262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,2,power_law_1.01,0.17492480278015138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,2,power_law_1.01,0.36420478820800783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,2,power_law_1.01,0.0438400000333786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,2,balanced,0.1393280029296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,2,balanced,1.5689867337544758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,2,power_law_1.01,0.23172481060028077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,2,power_law_1.01,0.47482881546020506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,2,power_law_1.01,0.04938879907131195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,2,power_law_1.01,0.2914560079574585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,2,power_law_1.01,0.6598336219787597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,2,power_law_1.01,0.05235840082168579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,2,power_law_1.01,0.4164415836334229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,2,power_law_1.01,0.9165120124816895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,2,power_law_1.01,0.06364160180091857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,2,power_law_1.01,0.5544256210327149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,2,power_law_1.01,0.06502400040626526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,2,power_law_1.01,0.9917823791503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,2,balanced,0.19026132424672446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,2,balanced,0.9577973683675131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,2,power_law_1.01,0.8063808441162109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,2,power_law_1.01,0.06766080260276794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,2,power_law_1.01,1.8275007247924804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,2,power_law_1.01,1.0391167640686034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,2,balanced,0.23809067408243814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,2,power_law_1.01,0.06862720251083373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,2,power_law_1.01,0.07237759828567505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,2,power_law_1.01,1.2581631660461425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,2,power_law_1.01,3.5133697509765627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,2,power_law_1.01,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,2,balanced,0.3612000147501628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,2,power_law_1.01,2.1022592544555665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,2,power_law_1.01,0.08316799998283386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,2,power_law_1.2,0.02678399980068207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,2,power_law_1.01,0.08523520231246948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,2,power_law_1.01,4.183583831787109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,2,power_law_1.2,0.027046400308609008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,2,balanced,0.43570133050282794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,2,power_law_1.2,0.029407998919486998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,2,power_law_1.01,0.09520000219345093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,2,power_law_1.2,0.035692799091339114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,2,balanced,1.1904746691385906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,2,power_law_1.2,0.04291839897632599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,2,power_law_1.2,0.058950400352478026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,2,power_law_1.2,0.06299520134925843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,2,power_law_1.01,0.10516480207443238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,2,balanced,0.6283466815948486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,2,power_law_1.2,0.06821759939193725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,2,power_law_1.01,0.11213439702987671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,2,power_law_1.2,0.06952959895133973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,2,power_law_1.2,0.07082239985466003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,2,power_law_1.2,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,2,power_law_1.2,0.08271999955177307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,2,power_law_1.01,0.11664639711380005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,2,power_law_1.2,0.08997120261192322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,2,balanced,0.81660262743632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,2,power_law_1.2,0.08300160169601441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,2,power_law_1.01,0.14702080488204955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,2,power_law_1.2,0.09000319838523865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,2,power_law_1.01,0.16492799520492554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,2,power_law_1.2,0.09262719750404358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,2,power_law_1.2,0.11353600025177002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,2,power_law_1.2,0.12551679611206054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,2,power_law_1.01,0.2228991985321045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,2,power_law_1.2,0.13246079683303832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,2,power_law_1.01,0.29690239429473875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,2,power_law_1.2,0.15638400316238404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,2,power_law_1.01,0.40746240615844725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,2,power_law_1.2,0.18897279500961303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,2,balanced,1.2077813148498535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,2,balanced,2.9930826822916665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,2,power_law_1.2,0.2342144012451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,2,power_law_1.01,0.4900352001190186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,2,balanced,1.8802612622578938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,2,power_law_1.2,0.275763201713562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,2,power_law_1.01,0.7366975784301758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,2,power_law_1.2,0.403545618057251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,2,power_law_1.2,0.5036672115325928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,2,power_law_1.01,0.8655424118041992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,2,power_law_1.2,0.7604544162750244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,2,power_law_1.01,1.377190399169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,2,power_law_1.2,0.9449343681335449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,2,power_law_1.2,1.130457592010498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,2,power_law_1.01,1.9147903442382812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,2,power_law_1.2,1.91146240234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,2,power_law_1.01,2.1860736846923827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,2,balanced,1.5956586201985676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,2,power_law_1.2,4.130892944335938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,2,power_law_1.01,3.7824512481689454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,2,power_law_1.01,7.287763214111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,2,power_law_1.2,0.036051198840141296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,2,power_law_1.2,0.031385600566864014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,2,power_law_1.2,0.034585601091384886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,2,power_law_1.2,0.040217599272727965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,2,balanced,1.9863039652506511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,2,power_law_1.2,0.04183039963245392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,2,power_law_1.2,0.05648639798164368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,2,power_law_1.2,0.059001600742340087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,2,power_law_1.2,0.059494400024414064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,2,power_law_1.2,0.06214399933815003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,2,power_law_1.2,0.06185600161552429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,2,power_law_1.2,0.06629760265350342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,2,power_law_1.2,0.0735360026359558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,2,balanced,3.600581487019857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,2,power_law_1.2,0.07242239713668823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,2,power_law_1.2,0.07774720191955567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,2,balanced,3.1389760971069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,2,power_law_1.2,0.08381440043449402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,2,power_law_1.2,0.08909440040588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,2,power_law_1.2,0.10092159509658813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,2,power_law_1.2,0.11936639547348023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,2,power_law_1.2,0.13118720054626465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,2,power_law_1.2,0.15560959577560424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,2,power_law_1.2,0.18106240034103394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,2,power_law_1.2,0.24395520687103273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,2,power_law_1.2,0.3030208110809326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,2,power_law_1.2,0.41680002212524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,2,power_law_1.2,0.5665535926818848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,2,power_law_1.2,0.8360320091247558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,2,power_law_1.2,1.0867520332336427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,2,power_law_1.2,1.3784895896911622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,2,power_law_1.2,2.3175039291381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,2,power_law_1.2,4.875526428222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,2,balanced,6.196367899576823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,2,power_law_1.2,0.03792639970779419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,2,power_law_1.2,0.04261119961738587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,2,power_law_1.2,0.043993601202964784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,2,power_law_1.2,0.04872319996356964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,2,power_law_1.2,0.050969600677490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,8,balanced,0.03793599953254064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,2,power_law_1.2,0.0637440025806427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,2,power_law_1.2,0.0645695984363556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,8,balanced,0.04855999847253164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,2,power_law_1.2,0.06709120273590088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,8,balanced,0.06287999947865804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,2,power_law_1.2,0.06933760046958923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,8,balanced,0.09674666325251262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,8,balanced,0.17453867197036743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,2,power_law_1.2,0.0717311978340149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,8,balanced,0.17340266704559326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,2,power_law_1.2,0.07774080038070678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,8,balanced,0.17363733053207397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,2,power_law_1.2,0.08163840174674988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,8,balanced,0.1711733341217041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,2,power_law_1.2,0.08621439933776856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,8,balanced,0.1726613243420919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,2,power_law_1.2,0.09301120042800903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,8,balanced,0.17223467429478964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,8,balanced,0.1755946675936381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,2,power_law_1.2,0.10437120199203491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,8,balanced,0.1766666571299235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,8,balanced,0.17644266287485758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,2,power_law_1.2,0.11038080453872681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,8,balanced,0.1814346710840861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,8,balanced,0.03534399966398875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,8,balanced,0.18616533279418945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,8,balanced,0.03668266783157984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,8,balanced,0.18681599696477255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,8,balanced,0.04771199822425842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,2,power_law_1.2,0.1190335988998413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,8,balanced,0.19079999128977457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,8,balanced,0.06938133140405019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,2,power_law_1.2,0.15322240591049194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,8,balanced,0.10529067118962605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,8,balanced,0.19504000743230185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,2,power_law_1.2,0.17212799787521363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,8,balanced,0.10693867007891338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,8,balanced,0.21538132429122925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,8,balanced,0.10724799831708272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,2,power_law_1.2,0.22040319442749023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,8,power_law_1.01,0.0938431978225708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,8,balanced,0.10758933424949646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,8,balanced,0.22006932894388834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,2,power_law_1.2,0.2904191970825195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,8,power_law_1.01,0.05295360088348389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,8,balanced,0.10809066891670227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,2,power_law_1.2,0.38800640106201173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,8,balanced,0.24610666433970133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,8,power_law_1.01,0.06349440217018128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,8,balanced,0.1090186635653178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,2,power_law_1.2,0.49000959396362304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,8,power_law_1.01,0.08643839955329895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,8,balanced,0.10910399754842122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,2,power_law_1.2,0.7368256092071533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,8,balanced,0.29011199871699017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,8,balanced,0.11059733231862386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,8,power_law_1.01,0.12291840314865113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,8,balanced,0.030533333619435627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,2,power_law_1.2,1.0938112258911132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,8,balanced,0.11222933729489644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,8,power_law_1.01,0.15611519813537597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,8,balanced,0.03379733363787333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,2,power_law_1.2,1.5273344039916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,8,power_law_1.01,0.15924479961395263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,8,balanced,0.11379200220108032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,8,balanced,0.30717867612838745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,8,balanced,0.0444160004456838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,8,balanced,0.12054933110872905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,8,power_law_1.01,0.1618880033493042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,2,power_law_1.2,1.9339328765869142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,8,balanced,0.06499200065930684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,8,power_law_1.01,0.1717120051383972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,8,balanced,0.12154666582743327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,2,power_law_1.2,2.6352512359619142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,8,balanced,0.1009173293908437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,8,power_law_1.01,0.1739967942237854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,8,balanced,0.43511998653411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,8,balanced,0.1262079974015554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,8,balanced,0.10147200028101604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,2,power_law_1.2,4.116044616699218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,8,power_law_1.01,0.179257595539093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,8,balanced,0.10212266445159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,8,balanced,0.1339466671148936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,8,power_law_1.01,0.1817023992538452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,8,balanced,0.10211199522018433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,2,power_law_1.2,8.137433624267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,8,balanced,0.14643200238545737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,8,power_law_1.01,0.1974527955055237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,8,balanced,0.10365866621335347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,8,balanced,0.5331253210703532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,8,power_law_1.01,0.19081599712371827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,8,balanced,0.10468266407648723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,8,balanced,0.1600266695022583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,8,power_law_1.01,0.21541759967803956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,8,balanced,0.10586133599281311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,8,balanced,0.18090667327245077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,8,power_law_1.01,0.22877440452575684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,8,balanced,0.10785599549611409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,8,power_law_1.01,0.20942718982696534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,8,balanced,0.11045866211255391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,8,balanced,0.23448532819747925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,8,power_law_1.01,0.24828801155090333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,8,balanced,0.1127946674823761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,8,power_law_1.01,0.06798719763755798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,8,balanced,0.7761440277099609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,8,power_law_1.01,0.27621119022369384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,8,power_law_1.01,0.045721599459648134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,8,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,8,power_law_1.01,0.31831040382385256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,8,balanced,0.25711466868718463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,8,power_law_1.01,0.06629120111465454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,8,power_law_1.01,0.335916805267334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,8,power_law_1.01,0.0756608009338379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,8,power_law_1.01,0.09968000054359435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,8,power_law_1.01,0.4453440189361572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,8,balanced,0.12012799580891927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,8,power_law_1.01,0.09934719800949096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,8,power_law_1.01,0.5396096229553222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,8,balanced,0.12108266353607178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,8,power_law_1.01,0.10476160049438477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,8,balanced,0.3638240098953247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,8,power_law_1.01,0.10551680326461792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,8,power_law_1.01,0.7338687896728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,8,power_law_1.01,0.1011199951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,8,power_law_1.01,0.9073344230651855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,8,power_law_1.01,0.11399680376052856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,8,balanced,1.0183146794637044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,8,power_law_1.01,0.11932159662246704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,8,power_law_1.01,1.1720576286315918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,8,power_law_1.01,0.12718720436096193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,8,power_law_1.01,1.704876708984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,8,power_law_1.01,0.12463999986648559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,8,balanced,0.4436426560084025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,8,power_law_1.01,0.1366912007331848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,8,power_law_1.01,2.2881216049194335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,8,power_law_1.01,0.13948800563812255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,8,power_law_1.01,0.14104959964752198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,8,power_law_1.01,3.4880001068115236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,8,power_law_1.01,0.16247040033340454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,8,balanced,0.13063466548919678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,8,power_law_1.01,0.19679360389709472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,8,power_law_1.01,7.1007743835449215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,8,power_law_1.01,0.20869760513305663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,8,balanced,0.14458133776982626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,8,power_law_1.01,0.24091520309448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,8,balanced,0.6424746513366699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,8,power_law_1.01,0.31766400337219236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,8,balanced,0.1532319982846578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,8,power_law_1.01,0.40015997886657717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,8,balanced,1.2656853199005127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,8,power_law_1.01,0.4817791938781738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,8,balanced,0.18750399351119995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,8,power_law_1.01,0.6694784164428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,8,power_law_1.01,1.1056896209716798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,8,balanced,0.2042293349901835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,8,power_law_1.01,1.2916928291320802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,8,power_law_1.01,1.6351232528686523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,8,balanced,0.3024746576944987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,8,power_law_1.01,2.854969596862793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,8,balanced,0.8334506352742513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,8,power_law_1.01,5.079891204833984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,8,balanced,0.3592373530069987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,8,power_law_1.2,0.0861631989479065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,8,power_law_1.01,0.06584320068359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,8,power_law_1.2,0.055827200412750244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,8,power_law_1.2,0.06170880198478699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,8,balanced,0.5205386479695638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,8,power_law_1.01,0.07134079933166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,8,power_law_1.2,0.08140799999237061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,8,power_law_1.01,0.04410240054130554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,8,power_law_1.2,0.10618879795074462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,8,power_law_1.01,0.06352639794349671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,8,power_law_1.2,0.15479040145874023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,8,balanced,1.9903519948323567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,8,power_law_1.01,0.07329279780387879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,8,power_law_1.2,0.1611199975013733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,8,balanced,0.688426653544108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,8,balanced,1.0436159769694011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,8,power_law_1.01,0.09561600089073181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,8,power_law_1.2,0.16348799467086791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,8,power_law_1.01,0.09816960096359253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,8,power_law_1.2,0.1732800006866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,8,power_law_1.01,0.1047551989555359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,8,power_law_1.2,0.17420799732208253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,8,power_law_1.01,0.1097216010093689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,8,power_law_1.2,0.1815168023109436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,8,power_law_1.2,0.18968960046768188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,8,power_law_1.01,0.11111680269241334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,8,balanced,1.0241866906483967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,8,power_law_1.01,0.11715199947357177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,8,power_law_1.2,0.2018752098083496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,8,power_law_1.01,0.12142720222473144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,8,power_law_1.2,0.1967039942741394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,8,power_law_1.01,0.13127039670944213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,8,power_law_1.2,0.2240000009536743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,8,power_law_1.01,0.14283519983291626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,8,power_law_1.2,0.2248703956604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,8,power_law_1.2,0.23797121047973632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,8,power_law_1.2,0.2650048017501831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,8,power_law_1.01,0.14600319862365724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,8,balanced,1.3621973991394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,8,power_law_1.2,0.30785279273986815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,8,balanced,1.6239946683247883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,8,power_law_1.01,0.15237120389938355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,8,power_law_1.2,0.3699520111083984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,8,power_law_1.2,0.39366400241851807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,8,power_law_1.01,0.15486079454421997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,8,power_law_1.2,0.4934591770172119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,8,power_law_1.01,0.18332159519195557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,8,power_law_1.2,0.6086336135864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,8,power_law_1.01,0.2203455924987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,8,power_law_1.2,0.9392895698547363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,8,power_law_1.01,0.2616447925567627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,8,power_law_1.2,0.955840015411377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,8,power_law_1.01,0.3497535943984985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,8,power_law_1.2,1.7132223129272461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,8,balanced,1.6874826749165852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,8,power_law_1.01,0.43225598335266113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,8,power_law_1.2,2.281388854980469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,8,power_law_1.01,0.6132991790771485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,8,power_law_1.01,0.795091199874878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,8,power_law_1.2,2.6600320816040037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,8,balanced,3.8043785095214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,8,power_law_1.01,1.2354816436767577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,8,power_law_1.2,5.388217544555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,8,power_law_1.01,1.7823167800903321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,8,power_law_1.01,2.1557376861572264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,8,power_law_1.2,8.948595428466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,8,power_law_1.01,3.152774429321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,8,power_law_1.01,4.70384635925293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,8,power_law_1.01,7.883602905273437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,8,balanced,2.655738671620687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,8,balanced,3.136207898457845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,8,power_law_1.2,0.06723840236663818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,8,power_law_1.2,0.0424703985452652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,8,power_law_1.2,0.0507968008518219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,8,power_law_1.2,0.06358399987220764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,8,power_law_1.2,0.07174400091171265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,8,power_law_1.2,0.09874560236930847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,8,power_law_1.2,0.10136959552764893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,8,power_law_1.2,0.10610560178756714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,8,power_law_1.2,0.10894720554351807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,8,power_law_1.2,0.10598399639129638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,8,power_law_1.2,0.10862079858779908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,8,power_law_1.2,0.12095359563827515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,8,power_law_1.2,0.12811520099639892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,8,power_law_1.2,0.12654080390930175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,8,power_law_1.2,0.139136004447937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,8,balanced,5.260064125061035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,8,power_law_1.2,0.06511359810829162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,8,power_law_1.2,0.1479423999786377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,8,power_law_1.2,0.03854719996452331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,8,power_law_1.2,0.1506816029548645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,8,power_law_1.2,0.04743039906024933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,8,power_law_1.2,0.1746559977531433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,8,power_law_1.2,0.0592960000038147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,8,power_law_1.2,0.19214080572128295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,8,power_law_1.2,0.06716799736022949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,8,power_law_1.2,0.2321216106414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,8,power_law_1.2,0.09905920028686524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,8,power_law_1.2,0.2865600109100342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,8,power_law_1.2,0.09811199903488159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,8,power_law_1.2,0.4212800025939941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,8,power_law_1.2,0.10586240291595458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,4,balanced,0.03814399987459183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,8,power_law_1.2,0.10804480314254761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,8,power_law_1.2,0.4681663990020752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,4,balanced,0.04629333317279816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,8,power_law_1.2,0.11077760457992554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,8,power_law_1.2,0.619046401977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,4,balanced,0.066170667608579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,8,power_law_1.2,0.12119040489196778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,4,balanced,0.09867200255393982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,8,power_law_1.2,0.7745664119720459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,4,balanced,0.17422932386398315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,8,power_law_1.2,0.1260800004005432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,4,balanced,0.1728586753209432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,8,power_law_1.2,1.0910911560058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,8,power_law_1.2,0.1360703945159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,4,balanced,0.17398399114608765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,4,balanced,0.17398399114608765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,8,power_law_1.2,0.15123200416564941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,8,power_law_1.2,1.581107234954834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,4,balanced,0.17402132352193198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,4,balanced,0.17493865887324014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,8,power_law_1.2,2.3949440002441404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,4,balanced,0.17631999651590982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,4,balanced,0.17782400051752725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,8,power_law_1.2,0.15587199926376344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,4,balanced,0.17939732472101846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,8,power_law_1.2,3.462335968017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,4,balanced,0.18459200859069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,8,power_law_1.2,0.1591423988342285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,4,balanced,0.19106133778889975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,8,power_law_1.2,7.707257843017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,4,balanced,0.19322667519251505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,4,balanced,0.20092799266179404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,8,power_law_1.2,0.1704192042350769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,4,balanced,0.20943999290466309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,8,power_law_1.2,0.2015615940093994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,4,balanced,0.22628267606099448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,8,power_law_1.2,0.26363520622253417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,4,balanced,0.24217599630355835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,8,power_law_1.2,0.2952064037322998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,4,balanced,0.2797706723213196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,8,power_law_1.2,0.373305606842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,8,power_law_1.2,0.5359551906585693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,4,balanced,0.31990933418273926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,8,power_law_1.2,0.7661439895629882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,8,power_law_1.2,1.0372544288635255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,4,balanced,0.35652267932891846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,8,power_law_1.2,1.4811455726623535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,8,power_law_1.2,2.2553216934204103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,8,power_law_1.2,2.974847984313965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,4,balanced,0.5098559856414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,8,power_law_1.2,3.6947776794433596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,8,power_law_1.2,6.677523040771485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,4,balanced,0.6315786838531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,8,power_law_1.2,13.968492126464843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,4,balanced,0.03418133407831192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,4,balanced,0.036559998989105225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,4,balanced,0.048432002464930214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,4,balanced,0.9261813163757324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,4,balanced,0.06915733218193054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,4,balanced,0.10685867071151733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,4,balanced,0.1076639990011851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,4,balanced,0.1076639990011851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,4,balanced,0.10912000139554341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,4,power_law_1.01,0.06332160234451294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,4,balanced,0.035375999907652535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,4,balanced,0.11012799541155498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,4,power_law_1.01,0.0515392005443573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,4,balanced,0.11126400033632915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,4,balanced,1.2154773076375325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,4,balanced,0.03751466671625773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,4,power_law_1.01,0.061919999122619626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,4,balanced,0.1109333336353302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,4,balanced,0.11433600385983785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,4,balanced,0.04706666866938273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,4,power_law_1.01,0.07585920095443725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,4,balanced,0.11586133639017741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,4,balanced,0.06765333314736684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,4,power_law_1.01,0.10243840217590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,4,balanced,0.11922666430473328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,4,balanced,0.10341866811116536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,4,power_law_1.01,0.15576319694519042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,4,balanced,0.12523200114568075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,4,balanced,0.10575466354688008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,4,power_law_1.01,0.16187520027160646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,4,power_law_1.01,0.04775039851665497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,4,balanced,0.10652800401051839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,4,balanced,0.12643200159072876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,4,power_law_1.01,0.1606528043746948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,4,balanced,0.10733333230018616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,4,power_law_1.01,0.03893760144710541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,4,balanced,0.1344213287035624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,4,power_law_1.01,0.1693120002746582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,4,balanced,0.10894399881362915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,4,power_law_1.01,0.050323200225830075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,4,balanced,0.14638933539390564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,4,power_law_1.01,0.17439359426498413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,4,balanced,1.5198453267415364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,4,power_law_1.01,0.06351360082626342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,4,balanced,0.11080533266067505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,4,power_law_1.01,0.17499519586563111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,4,balanced,0.16250133514404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,4,balanced,0.11215999722480774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,4,power_law_1.01,0.0713919997215271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,4,power_law_1.01,0.18077440261840821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,4,balanced,0.11539733409881592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,4,power_law_1.01,0.09582719802856446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,4,balanced,0.18173333009084067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,4,power_law_1.01,0.18823039531707764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,4,balanced,0.11895466844240825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,4,power_law_1.01,0.09891200065612793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,4,power_law_1.01,0.1945024013519287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,4,balanced,0.2158613403638204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,4,power_law_1.01,0.10037120580673217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,4,balanced,0.12257066369056702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,4,power_law_1.01,0.2092479944229126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,4,power_law_1.01,0.10416640043258667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,4,power_law_1.01,0.10641920566558838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,4,power_law_1.01,0.20721919536590577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,4,balanced,0.27163734038670856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,4,power_law_1.01,0.11050239801406861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,4,power_law_1.01,0.2170367956161499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,4,power_law_1.01,0.11667200326919555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,4,balanced,0.13450133800506592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,4,power_law_1.01,0.25004799365997316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,4,balanced,0.3126239975293477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,4,power_law_1.01,0.12407040596008301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,4,power_law_1.01,0.26051199436187744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,4,balanced,0.13726400335629782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,4,power_law_1.01,0.12127360105514526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,4,power_law_1.01,0.31527678966522216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,4,power_law_1.01,0.13308800458908082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,4,power_law_1.01,0.3771775960922241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,4,balanced,0.4503733317057292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,4,power_law_1.01,0.14064639806747437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,4,balanced,2.395253340403239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,4,power_law_1.01,0.46752638816833497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,4,power_law_1.01,0.14276479482650756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,4,power_law_1.01,0.5018112182617187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,4,power_law_1.01,0.16605440378189087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,4,power_law_1.01,0.6847551822662353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,4,power_law_1.01,0.1913472056388855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,4,balanced,0.1518346667289734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,4,balanced,0.5679893493652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,4,power_law_1.01,0.22101759910583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,4,power_law_1.01,0.9294079780578614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,4,balanced,0.1758400003115336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,4,power_law_1.01,0.28523519039154055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,4,power_law_1.01,1.31658878326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,4,power_law_1.01,0.35916800498962403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,4,balanced,0.18607999881108603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,4,power_law_1.01,0.05084159970283508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,4,power_law_1.01,1.7639999389648438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,4,power_law_1.01,0.4195199966430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,4,balanced,0.24757333596547446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,4,power_law_1.01,0.5685952186584473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,4,power_law_1.01,0.04219520092010498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,4,power_law_1.01,2.124710464477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,4,balanced,0.8353973229726156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,4,power_law_1.01,0.7201087951660157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,4,power_law_1.01,0.049670401215553286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,4,balanced,0.29445334275563556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,4,power_law_1.01,3.526438522338867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,4,power_law_1.01,1.0091391563415528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,4,power_law_1.01,0.06399359703063964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,4,power_law_1.01,0.07870720028877258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,4,power_law_1.01,1.3507328033447266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,4,balanced,0.4437013467152913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,4,power_law_1.01,7.5583740234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,4,power_law_1.01,0.09609599709510804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,4,power_law_1.01,1.6541568756103515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,4,power_law_1.01,0.10194560289382934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,4,balanced,0.5226666529973348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,4,power_law_1.01,2.8909759521484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,4,power_law_1.01,0.10531200170516967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,4,power_law_1.01,0.10751359462738037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,4,balanced,1.092570702234904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,4,power_law_1.01,5.826240158081054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,4,power_law_1.01,0.11738239526748658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,4,balanced,0.7585439682006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,4,power_law_1.01,0.12282880544662475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,4,power_law_1.01,0.13068159818649291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,4,power_law_1.01,0.13905919790267945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,4,power_law_1.01,0.15127040147781373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,4,balanced,1.0041013558705647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,4,power_law_1.01,0.15733120441436768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,4,balanced,1.3554879824320476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,4,balanced,4.705087979634603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,4,power_law_1.01,0.1715008020401001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,4,power_law_1.2,0.06209279894828797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,4,balanced,1.4871360460917156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,4,power_law_1.01,0.1806720018386841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,4,power_law_1.2,0.04679679870605469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,4,power_law_1.01,0.2031615972518921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,4,power_law_1.2,0.06296319961547851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,4,power_law_1.01,0.24428160190582277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,4,power_law_1.2,0.07292159795761108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,4,power_law_1.2,0.10124800205230713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,4,power_law_1.01,0.35500800609588623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,4,power_law_1.2,0.1566848039627075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,4,power_law_1.01,0.44715518951416017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,4,power_law_1.2,0.16143360137939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,4,power_law_1.01,0.5544447898864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,4,power_law_1.2,0.16128000020980834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,4,balanced,1.9682025909423828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,4,power_law_1.01,0.6780032157897949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,4,power_law_1.2,0.1719231963157654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,4,power_law_1.01,1.061894416809082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,4,power_law_1.2,0.17573120594024658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,4,power_law_1.2,0.18090879917144775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,4,power_law_1.01,1.3203776359558106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,4,balanced,2.084895928700765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,4,power_law_1.2,0.17521920204162597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,4,power_law_1.01,2.0706560134887697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,4,power_law_1.2,0.19721599817276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,4,power_law_1.01,2.5987455368041994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,4,power_law_1.2,0.047040000557899475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,4,power_law_1.2,0.19411840438842773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,4,power_law_1.01,3.3761024475097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,4,power_law_1.2,0.2084415912628174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,4,power_law_1.2,0.03697279989719391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,4,power_law_1.2,0.22323839664459227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,4,power_law_1.2,0.04657920002937317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,4,power_law_1.01,4.851884841918945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,4,balanced,2.4420960744222007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,4,power_law_1.2,0.2238976001739502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,4,power_law_1.2,0.05862399935722351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,4,power_law_1.2,0.25201280117034913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,4,power_law_1.2,0.07082880139350892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,4,power_law_1.01,11.076959991455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,4,power_law_1.2,0.285478401184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,4,power_law_1.2,0.09669119715690613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,4,power_law_1.2,0.09921280145645142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,4,power_law_1.2,0.3328448057174683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,4,power_law_1.2,0.10196479558944702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,4,power_law_1.2,0.37907838821411133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,4,power_law_1.2,0.10697599649429321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,4,power_law_1.2,0.48073601722717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,4,power_law_1.2,0.10315519571304321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,4,power_law_1.2,0.5158847808837891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,4,power_law_1.2,0.11548800468444824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,4,power_law_1.2,0.8170368194580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,4,power_law_1.2,0.1201024055480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,4,power_law_1.2,1.0364224433898925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,4,power_law_1.2,0.12329599857330323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,4,power_law_1.2,1.693017578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,4,power_law_1.2,0.12461440563201905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,4,power_law_1.2,2.1069183349609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,4,power_law_1.2,0.13447680473327636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,4,power_law_1.2,0.13699840307235717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,4,balanced,3.864709218343099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,4,power_law_1.2,2.5135936737060547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,4,power_law_1.2,0.15261440277099608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,4,power_law_1.2,0.17429120540618898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,4,power_law_1.2,3.8566078186035155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,4,power_law_1.2,0.20208640098571778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,4,power_law_1.2,0.23761920928955077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,4,power_law_1.2,9.24206085205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,4,power_law_1.2,0.304915189743042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,4,power_law_1.2,0.38007678985595705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,4,balanced,4.0546080271403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,4,power_law_1.2,0.4476607799530029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,4,power_law_1.2,0.6647168159484863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,4,power_law_1.2,0.8665663719177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,4,power_law_1.2,1.2325440406799317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,4,power_law_1.2,1.8255424499511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,4,power_law_1.2,2.0979583740234373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,4,power_law_1.2,3.2362686157226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,4,power_law_1.2,7.172934722900391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,4,balanced,7.677530924479167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,4,power_law_1.2,0.050425601005554196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,4,power_law_1.2,0.04154239892959595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,4,power_law_1.2,0.052665597200393675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,2,balanced,0.03917866696914037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,4,power_law_1.2,0.05414400100708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,4,power_law_1.2,0.06716799736022949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,2,balanced,0.04671466847260793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,4,power_law_1.2,0.09904639720916748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,2,balanced,0.06473066906134288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,4,power_law_1.2,0.10188800096511841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,2,balanced,0.1011306643486023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,2,balanced,0.17567465702692667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,4,power_law_1.2,0.10860799551010132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,2,balanced,0.17781867583592734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,4,power_law_1.2,0.11282559633255004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,2,balanced,0.17696533600489298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,4,power_law_1.2,0.11708159446716308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,2,balanced,0.17573332786560059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,2,balanced,0.0355679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,4,power_law_1.2,0.12714879512786864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,2,balanced,0.17942933241526285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,2,balanced,0.17839467525482178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,4,power_law_1.2,0.13096959590911866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,2,balanced,0.038405333956082664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,2,balanced,0.1818986733754476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,4,power_law_1.2,0.13903360366821288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,2,balanced,0.05056533217430115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,2,balanced,0.1845866640408834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,4,power_law_1.2,0.1510655999183655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,2,balanced,0.07398400207360585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,2,balanced,0.18639467159907022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,2,balanced,0.11382933457692464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,2,balanced,0.1927093267440796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,2,balanced,0.11568533380826314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,4,power_law_1.2,0.16020480394363404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,2,balanced,0.2007840077082316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,2,balanced,0.11595732967058818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,4,power_law_1.2,0.1720896005630493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,2,balanced,0.20457067092259726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,2,balanced,0.11565867066383362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,2,balanced,0.11813867092132568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,2,balanced,0.21755200624465942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,2,balanced,0.11971732974052429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,2,balanced,0.23269333442052206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,4,power_law_1.2,0.17843199968338014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,2,balanced,0.1207413375377655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,2,balanced,0.2500586708386739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,4,power_law_1.2,0.22753920555114746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,2,balanced,0.1241919994354248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,4,power_law_1.2,0.2537152051925659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,2,balanced,0.1250986655553182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,2,balanced,0.27987732489903766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,2,balanced,0.12923733393351236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,4,power_law_1.2,0.3838848114013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,2,balanced,0.13758400082588196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,2,balanced,0.32285867134730023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,4,power_law_1.2,0.4450496196746826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,2,balanced,0.1421440045038859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,4,power_law_1.2,0.5543424129486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,4,power_law_1.2,0.8118016242980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,2,balanced,0.15562666455904642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,2,balanced,0.4018933375676473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,4,power_law_1.2,1.1572928428649902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,2,balanced,0.17409066359202066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,4,power_law_1.2,1.6171136856079102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,2,balanced,0.1921280026435852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,2,balanced,0.46171732743581134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,4,power_law_1.2,2.5036096572875977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,2,balanced,0.22166933616002402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,4,power_law_1.2,3.3099903106689452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,4,power_law_1.2,4.326483154296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,2,balanced,0.2606400052706401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,2,balanced,0.6689013640085856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,4,power_law_1.2,7.153587341308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,2,balanced,0.35303465525309247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,4,power_law_1.2,15.25524444580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,2,balanced,0.42590399583180744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,2,balanced,0.8492586612701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,2,balanced,0.6257013479868571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,2,balanced,0.045968001087506614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,2,balanced,0.049141332507133484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,2,balanced,1.2525920073191326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,2,balanced,0.05714133381843567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,2,balanced,0.07855466504891713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,2,balanced,0.8061652978261312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,2,balanced,0.11913067102432251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,2,balanced,0.1220960021018982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,2,balanced,0.12424533565839131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,2,balanced,0.1253973344961802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,2,balanced,0.1267466644446055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,2,balanced,0.13036800424257913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,2,balanced,0.13446933031082153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,2,balanced,0.13994133472442627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,2,balanced,1.1938239733378093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,2,balanced,1.6529547373453777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,2,power_law_1.01,0.04636160135269165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,2,balanced,0.14510400096575418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,2,balanced,0.15079466501871744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,2,power_law_1.01,0.04177280068397522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,2,power_law_1.01,0.05489919781684875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,2,power_law_1.01,0.07596160173416137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,2,power_law_1.01,0.09873920083045959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,2,power_law_1.01,0.15110399723052978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,2,balanced,0.16866666078567505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,2,power_law_1.01,0.1582208037376404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,2,balanced,1.5602773030598958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,2,balanced,0.1720106601715088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,2,power_law_1.01,0.03837440013885498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,2,power_law_1.01,0.16291199922561644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,2,balanced,2.0651572545369468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,2,power_law_1.01,0.17073919773101806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,2,power_law_1.01,0.038822400569915774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,2,power_law_1.01,0.17727359533309936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,2,power_law_1.01,0.04431360065937042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,2,power_law_1.01,0.17998720407485963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,2,power_law_1.01,0.06496639847755432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,2,power_law_1.01,0.07262719869613647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,2,power_law_1.01,0.19549440145492553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,2,balanced,0.20244266589482626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,2,power_law_1.01,0.10138880014419556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,2,power_law_1.01,0.19453439712524415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,2,power_law_1.01,0.10453120470046998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,2,balanced,0.24461867411931357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,2,power_law_1.01,0.19921280145645143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,2,power_law_1.01,0.10826879739761353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,2,balanced,1.9601066907246907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,2,balanced,0.27875733375549316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,2,power_law_1.01,0.2185215950012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,2,power_law_1.01,0.11418880224227905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,2,power_law_1.01,0.04597119987010956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,2,power_law_1.01,0.22747519016265869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,2,power_law_1.01,0.11632640361785888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,2,balanced,0.3876533508300781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,2,power_law_1.01,0.05052800178527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,2,power_law_1.01,0.12190719842910766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,2,power_law_1.01,0.22422399520874023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,2,power_law_1.01,0.05389440059661865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,2,power_law_1.01,0.12877440452575684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,2,power_law_1.01,0.2625663995742798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,2,balanced,0.4517120122909546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,2,power_law_1.01,0.07416960000991821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,2,power_law_1.01,0.1338752031326294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,2,power_law_1.01,0.28222079277038575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,2,power_law_1.01,0.0840063989162445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,2,power_law_1.01,0.13760639429092408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,2,balanced,3.1586879094441733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,2,power_law_1.01,0.35260159969329835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,2,balanced,0.6832746664683024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,2,power_law_1.01,0.10773760080337524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,2,power_law_1.01,0.14410879611968994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,2,power_law_1.01,0.39328000545501707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,2,power_law_1.01,0.1575744032859802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,2,power_law_1.01,0.11653759479522705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,2,power_law_1.2,0.04455040097236633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,2,power_law_1.01,0.5020991802215576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,2,power_law_1.01,0.16709760427474976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,2,power_law_1.01,0.12122880220413208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,2,balanced,0.8227946758270264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,2,power_law_1.2,0.04193280041217804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,2,power_law_1.01,0.19780479669570922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,2,power_law_1.01,0.5693888187408447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,2,power_law_1.01,0.12686079740524292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,2,power_law_1.2,0.05464959740638733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,2,power_law_1.01,0.21377279758453369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,2,power_law_1.01,0.1313088059425354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,2,power_law_1.01,0.796563196182251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,2,power_law_1.2,0.07412480115890503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,2,power_law_1.01,0.26705920696258545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,2,power_law_1.01,0.14177279472351073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,2,balanced,1.2094240188598633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,2,power_law_1.01,0.9837887763977051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,2,balanced,2.9978240331014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,2,power_law_1.2,0.09129599928855896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,2,power_law_1.01,0.31543679237365724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,2,power_law_1.01,0.14895999431610107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,2,power_law_1.01,1.4225215911865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,2,power_law_1.2,0.1484544038772583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,2,power_law_1.01,0.16486400365829468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,2,power_law_1.01,0.42654080390930177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,2,power_law_1.2,0.1577280044555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,2,power_law_1.01,0.17816319465637206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,2,power_law_1.01,1.8874048233032226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,2,power_law_1.01,0.5251584053039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,2,power_law_1.2,0.16636799573898314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,2,power_law_1.01,0.6952896118164062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,2,balanced,1.6001332600911458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,2,power_law_1.01,2.2357311248779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,2,power_law_1.2,0.17770880460739136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,2,power_law_1.01,0.9138367652893067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,2,power_law_1.01,0.19182080030441284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,2,power_law_1.01,4.039481735229492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,2,power_law_1.2,0.1804159998893738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,2,power_law_1.01,1.2524352073669434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,2,power_law_1.01,0.2127232074737549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,2,power_law_1.2,0.1839679956436157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,2,power_law_1.01,1.6190719604492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,2,power_law_1.01,7.144895935058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,2,power_law_1.2,0.1906623959541321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,2,power_law_1.01,0.21377921104431152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,2,power_law_1.01,2.1610176086425783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,2,power_law_1.2,0.19428479671478271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,2,balanced,2.376842657725016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,2,power_law_1.01,0.284332799911499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,2,power_law_1.2,0.20222079753875732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,2,power_law_1.01,3.3331199645996095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,2,power_law_1.01,0.34936959743499757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,2,power_law_1.2,0.2169408082962036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,2,power_law_1.01,0.45269122123718264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,2,power_law_1.2,0.22899839878082276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,2,power_law_1.01,7.154310607910157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,2,power_law_1.01,0.5598015785217285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,2,power_law_1.2,0.23783679008483888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,2,power_law_1.01,0.7650815963745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,2,power_law_1.2,0.273638391494751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,2,power_law_1.01,0.9438207626342774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,2,power_law_1.2,0.2882303953170776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,2,balanced,3.138970692952474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,2,power_law_1.01,1.3876480102539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,2,power_law_1.2,0.3371968030929565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,2,balanced,6.219519933064778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,2,power_law_1.01,1.8557184219360352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,2,power_law_1.2,0.44272642135620116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,2,power_law_1.01,2.611942481994629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,2,power_law_1.2,0.5187136173248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,2,power_law_1.2,0.5785088062286377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,2,power_law_1.01,3.5943744659423826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,2,power_law_1.2,0.8106304168701172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,2,power_law_1.01,4.6889598846435545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,2,power_law_1.2,1.0466431617736816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,2,balanced,5.84121576944987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,2,power_law_1.01,6.960249328613282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,2,power_law_1.2,1.6390592575073242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,2,balanced,3.8954238891601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,2,power_law_1.2,1.8570175170898438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,2,power_law_1.01,13.882777404785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,2,power_law_1.2,2.5850879669189455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,2,power_law_1.2,3.96044807434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,2,power_law_1.2,8.05973129272461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,2,power_law_1.2,0.037510401010513304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,2,power_law_1.2,0.03869439959526062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,2,balanced,6.172400156656901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,2,power_law_1.2,0.045184001326560974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,2,power_law_1.2,0.057120001316070555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,2,power_law_1.2,0.07192320227622986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,2,power_law_1.2,0.10216959714889526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,2,power_law_1.2,0.1049280047416687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,2,power_law_1.2,0.10874240398406983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,2,power_law_1.2,0.11591039896011353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,2,power_law_1.2,0.11520639657974244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,2,power_law_1.2,0.12318719625473022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,2,power_law_1.2,0.1327679991722107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,2,power_law_1.2,0.1383039951324463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,2,power_law_1.2,0.1368191957473755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,2,power_law_1.2,0.15374079942703248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,2,power_law_1.2,0.15821440219879152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,2,power_law_1.2,0.17541120052337647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,2,power_law_1.2,0.19578880071640015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,2,power_law_1.2,0.21663360595703124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,2,power_law_1.2,0.2651648044586182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,2,power_law_1.2,0.3251391887664795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,2,power_law_1.2,0.41532158851623535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,2,power_law_1.2,0.5052288055419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,2,power_law_1.2,0.6972288131713867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,2,balanced,12.212139129638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,2,power_law_1.2,0.9805503845214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,2,power_law_1.2,1.3640640258789063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,2,power_law_1.2,1.8223743438720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,2,power_law_1.2,2.1387008666992187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,2,power_law_1.2,4.060595321655273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,2,power_law_1.2,8.216595458984376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,2,power_law_1.2,0.04647679924964905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,2,power_law_1.2,0.04930559992790222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,2,power_law_1.2,0.051974397897720334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,2,power_law_1.2,0.06520320177078247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,2,power_law_1.2,0.0785535991191864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,1,balanced,0.04163199911514918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,2,power_law_1.2,0.10988160371780395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,1,balanced,0.05183466772238413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,2,power_law_1.2,0.11436799764633179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,1,balanced,0.06926933427651723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,2,power_law_1.2,0.12182400226593018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,1,balanced,0.10946666200955708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,2,power_law_1.2,0.13034240007400513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,1,balanced,0.19323732455571493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,2,power_law_1.2,0.1301375985145569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,1,balanced,0.19137599070866904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,2,power_law_1.2,0.1422719955444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,1,balanced,0.1909760038057963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,1,balanced,0.03812800099452337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,2,power_law_1.2,0.15518720149993898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,1,balanced,0.19307732582092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,2,power_law_1.2,0.16328320503234864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,1,balanced,0.04327466587225596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,1,balanced,0.19425066312154135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,1,balanced,0.058965335289637245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,2,power_law_1.2,0.1854143977165222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,1,balanced,0.19390400250752768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,1,balanced,0.196943998336792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,1,balanced,0.0860053300857544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,1,balanced,0.20163200298945108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,1,balanced,0.13317867120107016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,2,power_law_1.2,0.19833600521087646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,1,balanced,0.1358453333377838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,1,balanced,0.2053813338279724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,2,power_law_1.2,0.2119296073913574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,1,balanced,0.13664000233014426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,1,balanced,0.2062399983406067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,1,balanced,0.13713600238164267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,1,balanced,0.22396800915400186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,1,power_law_1.01,0.04036479890346527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,2,power_law_1.2,0.22355198860168457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,1,balanced,0.14125333229700723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,1,balanced,0.23187732696533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,1,power_law_1.01,0.04442879855632782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,2,power_law_1.2,0.27727999687194826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,1,balanced,0.1425493359565735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,1,balanced,0.2569813330968221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,1,power_law_1.01,0.06038399934768677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,1,balanced,0.14679466684659323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,2,power_law_1.2,0.36348159313201905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,1,balanced,0.2874506711959839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,1,power_law_1.01,0.07665280103683472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,1,balanced,0.14907733599344888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,2,power_law_1.2,0.48810877799987795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,1,power_law_1.01,0.10021120309829712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,1,balanced,0.31113600730895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,1,balanced,0.15262400110562643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,2,power_law_1.2,0.6191552162170411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,1,power_law_1.01,0.16465920209884644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,1,balanced,0.3564053376515706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,1,balanced,0.1609173317750295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,2,power_law_1.2,0.7938111782073974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,1,power_law_1.01,0.03585279881954193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,1,power_law_1.01,0.17486079931259155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,1,balanced,0.06780800223350525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,1,balanced,0.17332265774408975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,1,power_law_1.01,0.1830464005470276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,1,balanced,0.07180800040562947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,2,power_law_1.2,1.002246379852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,1,balanced,0.3933653434117635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,1,power_law_1.01,0.03885439932346344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,1,balanced,0.07986666758855183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,1,balanced,0.18126932779947916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,1,power_law_1.01,0.18322559595108032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,1,power_law_1.01,0.05008640289306641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,2,power_law_1.2,1.4531007766723634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,1,balanced,0.10572266578674316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,1,power_law_1.01,0.18986239433288574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,1,balanced,0.1550986667474111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,1,balanced,0.20739734172821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,1,power_law_1.01,0.06755840182304382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,1,balanced,0.5777759949366251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,1,balanced,0.1609173317750295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,2,power_law_1.2,2.0634176254272463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,1,power_law_1.01,0.20403199195861815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,1,power_law_1.01,0.0804095983505249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,1,balanced,0.16356266538302103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,1,balanced,0.2414240042368571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,1,power_law_1.01,0.22210559844970704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,1,balanced,0.16883732875188193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,2,power_law_1.2,2.6110208511352537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,1,power_law_1.01,0.11841919422149658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,1,balanced,0.17111466328303018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,1,balanced,0.6921119689941406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,1,balanced,0.26394132773081463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,1,power_law_1.01,0.22855679988861083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,1,power_law_1.01,0.12236160039901733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,1,balanced,0.17628800868988037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,2,power_law_1.2,4.129062271118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,1,balanced,0.1825760006904602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,1,power_law_1.01,0.22386560440063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,1,power_law_1.01,0.12791680097579955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,1,balanced,0.31785066922505695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,1,balanced,0.19290133317311606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,2,power_law_1.2,4.673766326904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,1,power_law_1.01,0.1371072053909302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,1,power_law_1.01,0.2352384090423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,1,balanced,0.20104533433914185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,1,balanced,1.0276959737141926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,1,power_law_1.01,0.2554368019104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,1,balanced,0.2107413411140442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,1,power_law_1.01,0.14039039611816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,1,balanced,0.36217065652211505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,2,power_law_1.2,7.645132446289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,1,power_law_1.01,0.14731520414352417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,1,power_law_1.01,0.27263360023498534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,1,power_law_1.01,0.1576640009880066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,1,power_law_1.01,0.3226624011993408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,1,balanced,0.5395626624425253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,2,power_law_1.2,15.610528564453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,1,power_law_1.01,0.16629120111465454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,1,power_law_1.01,0.34223361015319825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,1,balanced,0.24303466081619263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,1,balanced,1.2944213549296062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,1,power_law_1.01,0.17022720575332642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,1,power_law_1.01,0.4226560115814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,1,balanced,0.25150400400161743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,1,power_law_1.01,0.18394880294799804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,1,balanced,0.6473653316497803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,1,power_law_1.01,0.4908160209655762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,1,power_law_1.01,0.20067200660705567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,1,power_law_1.01,0.6449408054351806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,1,power_law_1.01,0.2229696035385132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,1,power_law_1.01,0.7943808078765869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,1,power_law_1.01,0.2684927940368652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,1,balanced,1.002127965291341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,1,power_law_1.01,1.1078656196594239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,1,power_law_1.01,0.2934272050857544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,1,balanced,0.32153600454330444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,1,balanced,1.9184746742248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,1,power_law_1.01,1.3683584213256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,1,power_law_1.01,0.3551743984222412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,1,balanced,0.4158613284428914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,1,power_law_1.01,1.9305343627929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,1,power_law_1.01,0.4375616073608398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,1,balanced,0.45443201065063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,1,power_law_1.01,0.5883456230163574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,1,power_law_1.01,2.516326332092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,1,balanced,1.3289546966552734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,1,balanced,0.6497546831766764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,1,power_law_1.01,0.71877121925354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,1,power_law_1.01,3.0988544464111327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,1,power_law_1.01,1.0129216194152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,1,balanced,0.7725173632303873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,1,power_law_1.01,4.866131210327149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,1,power_law_1.01,1.314246368408203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,1,balanced,1.1928266684214275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,1,balanced,2.5559093157450357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,1,power_law_1.01,1.937164878845215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,1,power_law_1.01,10.277177429199218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,1,power_law_1.01,2.5662527084350586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,1,balanced,1.9904534022013347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,1,balanced,1.4618186950683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,1,power_law_1.01,3.173004722595215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,1,power_law_1.01,5.001548767089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,1,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,1,balanced,2.154266675313314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,1,power_law_1.01,10.30187530517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,1,power_law_1.01,0.06859520077705383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,1,power_law_1.01,0.07665280103683472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,1,power_law_1.2,0.04067200124263763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,1,balanced,2.6258079210917153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,1,power_law_1.01,0.08971520066261292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,1,balanced,3.2151412963867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,1,balanced,2.831535975138346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,1,power_law_1.01,0.1034816026687622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,1,power_law_1.2,0.04411520063877106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,1,power_law_1.01,0.14327679872512816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,1,power_law_1.2,0.06079999804496765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,1,power_law_1.01,0.14820480346679688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,1,power_law_1.2,0.0754688024520874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,1,power_law_1.01,0.15495680570602416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,1,power_law_1.2,0.0953984022140503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,1,balanced,4.1911360422770185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,1,power_law_1.01,0.16545920372009276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,1,power_law_1.2,0.16505600214004518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,1,power_law_1.01,0.17787519693374634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,1,power_law_1.2,0.1730239987373352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,1,power_law_1.2,0.18495999574661254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,1,power_law_1.01,0.18855680227279664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,1,balanced,3.2919092178344727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,1,power_law_1.01,0.20424320697784423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,1,power_law_1.2,0.18950400352478028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,1,power_law_1.2,0.19781119823455812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,1,power_law_1.01,0.21946239471435547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,1,power_law_1.2,0.20759038925170897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,1,power_law_1.01,0.245580792427063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,1,balanced,5.572549184163411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,1,power_law_1.2,0.2236543893814087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,1,balanced,4.8240000406901045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,1,power_law_1.2,0.23707520961761475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,1,power_law_1.01,0.2635456085205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,1,power_law_1.2,0.22577919960021972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,1,power_law_1.01,0.286297607421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,1,power_law_1.2,0.24036478996276855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,1,power_law_1.2,0.2605247974395752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,1,power_law_1.2,0.2767807960510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,1,power_law_1.01,0.32663679122924805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,1,power_law_1.2,0.32702078819274905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,1,power_law_1.01,0.4300223827362061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,1,power_law_1.2,0.3535680055618286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,1,power_law_1.01,0.5095935821533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,1,balanced,6.930304209391276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,1,power_law_1.2,0.4273536205291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,1,power_law_1.01,0.689740800857544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,1,balanced,4.946672121683757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,1,power_law_1.2,0.4955904006958008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,1,power_law_1.01,0.85863037109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,1,power_law_1.2,0.647654390335083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,1,power_law_1.01,1.190272045135498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,1,power_law_1.2,0.8030655860900879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,1,power_law_1.01,1.5158656120300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,1,power_law_1.2,1.1270591735839843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,1,power_law_1.2,1.3902463912963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,1,power_law_1.01,2.1960895538330076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,1,power_law_1.2,1.965235137939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,1,power_law_1.01,2.8787839889526365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,1,power_law_1.2,2.5261760711669923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,1,power_law_1.01,4.237766265869141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,1,power_law_1.2,3.130092811584473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,1,power_law_1.01,5.591487884521484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,1,power_law_1.2,5.150451278686523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,1,power_law_1.01,6.941407775878906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,1,balanced,11.011690775553385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,1,power_law_1.2,10.343520355224609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,1,power_law_1.01,10.999411010742188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,1,power_law_1.01,21.834501647949217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,1,balanced,9.70310910542806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,1,balanced,9.728495915730795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,1,power_law_1.2,0.037196800112724304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,1,power_law_1.2,0.04004479944705963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,1,power_law_1.2,0.04881280064582825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,1,power_law_1.2,0.06316159963607788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,1,power_law_1.2,0.07524480223655701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,1,power_law_1.2,0.11980799436569214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,1,power_law_1.2,0.12421120405197143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,1,balanced,21.908841451009113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,1,power_law_1.2,0.1341248035430908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,1,power_law_1.2,0.13865599632263184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,1,power_law_1.2,0.14177919626235963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,1,power_law_1.2,0.15166079998016357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,1,power_law_1.2,0.16090240478515624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,1,power_law_1.2,0.17315200567245484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,1,power_law_1.2,0.1718016028404236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,1,power_law_1.2,0.18826240301132202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,1,power_law_1.2,0.05885440111160278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,1,power_law_1.2,0.20086400508880614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,1,power_law_1.2,0.07014399766921997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,1,power_law_1.2,0.22505600452423097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,1,power_law_1.2,0.07464320063591004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,1,power_law_1.2,0.27073280811309813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,8,balanced,0.07454399764537811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,1,power_law_1.2,0.08494719862937927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,1,power_law_1.2,0.2992511987686157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,8,balanced,0.08699733018875122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,1,power_law_1.2,0.09969279766082764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,8,balanced,0.12894933422406515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,1,power_law_1.2,0.3621056079864502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,8,balanced,0.22175999482472739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,1,power_law_1.2,0.13963520526885986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,1,power_law_1.2,0.4401599884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,8,balanced,0.3908640146255493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,8,balanced,0.48098134994506836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,1,power_law_1.2,0.1512511968612671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,1,power_law_1.2,0.5875967979431153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,8,balanced,0.4843680063883464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,1,power_law_1.2,0.15941760540008545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,8,balanced,0.48429866631825763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,1,power_law_1.2,0.7204736232757568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,8,balanced,0.4833279848098755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,1,power_law_1.2,0.1703871965408325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,8,balanced,0.4856479962666829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,1,power_law_1.2,1.015231990814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,8,balanced,0.48792533079783124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,1,power_law_1.2,0.17562880516052246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,8,balanced,0.48946134249369305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,1,power_law_1.2,1.327571201324463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,1,power_law_1.2,0.19101439714431762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,8,balanced,0.49478399753570557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,1,power_law_1.2,1.9475711822509765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,8,balanced,0.4984533389409383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,1,power_law_1.2,0.20577919483184814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,8,balanced,0.5044800043106079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,1,power_law_1.2,0.2185983896255493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,1,power_law_1.2,2.5621055603027343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,8,balanced,0.5192053318023682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,1,power_law_1.2,0.24561920166015624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,8,balanced,0.5122666756312052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,1,power_law_1.2,3.176595115661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,8,balanced,0.5935946702957153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,8,balanced,0.5451733271280924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,1,power_law_1.2,5.089888000488282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,1,power_law_1.2,0.26488959789276123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,1,power_law_1.2,0.2894975900650024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,8,balanced,0.8596746921539307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,1,power_law_1.2,10.388813018798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,8,balanced,0.616207997004191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,1,power_law_1.2,0.3284800052642822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,1,power_law_1.2,0.4302207946777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,8,balanced,1.0286133289337158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,1,power_law_1.2,0.5122560024261474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,1,power_law_1.2,0.6908031940460205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,8,balanced,0.8273813724517822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,1,power_law_1.2,0.8574336051940918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,1,power_law_1.2,1.190060806274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,8,balanced,1.4462773005167644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,1,power_law_1.2,1.522489643096924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,1,power_law_1.2,2.196294403076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,1,power_law_1.2,2.883462333679199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,8,balanced,1.4485386212666829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,1,power_law_1.2,4.240447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,1,power_law_1.2,5.588499069213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,1,power_law_1.2,6.95362548828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,1,power_law_1.2,10.993260955810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,8,balanced,2.0855253537495932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,8,balanced,0.05541333556175232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,1,power_law_1.2,21.805311584472655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,8,balanced,0.06531199812889099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,8,balanced,0.08904533584912618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,8,balanced,0.1370186706384023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,8,balanced,0.22336000204086304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,8,balanced,0.2741653323173523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,8,balanced,2.788693428039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,8,balanced,0.2761920094490051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,8,balanced,0.2725866635640462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,8,balanced,0.27534399429957074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,8,balanced,0.2748639980951945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,8,balanced,0.27780266602834064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,8,balanced,0.27909332513809204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,8,power_law_1.01,0.2201024055480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,8,balanced,0.2796693245569865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,8,power_law_1.01,0.30020480155944823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,8,balanced,2.975104014078776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,8,balanced,0.2837173342704773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,8,power_law_1.01,0.15056639909744263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,8,balanced,0.29214932521184284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,8,power_law_1.01,0.20485119819641112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,8,balanced,0.2985919912656148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,8,power_law_1.01,0.1307136058807373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,8,power_law_1.01,0.2677504062652588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,8,balanced,0.3027199904123942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,8,power_law_1.01,0.18874239921569824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,8,power_law_1.01,0.4003392219543457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,8,balanced,0.3821760018666585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,8,power_law_1.01,0.09048320055007934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,8,power_law_1.01,0.416864013671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,8,balanced,0.05309866865475973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,8,balanced,0.33292800188064575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,8,power_law_1.01,0.13508479595184325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,8,power_law_1.01,0.42113280296325684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,8,balanced,0.06324266890684764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,8,power_law_1.01,0.16575360298156738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,8,balanced,0.46695466836293537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,8,power_law_1.01,0.4340735912322998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,8,balanced,0.09244799613952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,8,power_law_1.01,0.22303359508514403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,8,power_law_1.01,0.46323838233947756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,8,balanced,0.14291733503341675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,8,power_law_1.01,0.2508863925933838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,8,balanced,0.39979732036590576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,8,power_law_1.01,0.47793917655944823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,8,power_law_1.01,0.24223361015319825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,8,balanced,0.22207466761271158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,8,power_law_1.01,0.49872641563415526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,8,power_law_1.01,0.24501121044158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,8,balanced,0.27216533819834393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,8,balanced,0.6622666517893473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,8,power_law_1.01,0.24997119903564452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,8,power_law_1.01,0.5197055816650391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,8,balanced,4.982229232788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,8,balanced,0.27457600831985474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,8,power_law_1.01,0.25155839920043943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,8,power_law_1.01,0.517248010635376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,8,balanced,0.5658666690190634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,8,balanced,0.27611732482910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,8,power_law_1.01,0.27119998931884765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,8,power_law_1.01,0.5878464221954346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,8,balanced,0.2765706578890483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,8,power_law_1.01,0.2925184011459351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,8,power_law_1.01,0.6162559986114502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,8,balanced,0.27932266394297284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,8,power_law_1.01,0.29713280200958253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,8,power_law_1.01,0.6012608051300049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,8,balanced,0.9426453113555908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,8,balanced,0.2815306584040324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,8,power_law_1.01,0.31959679126739504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,8,power_law_1.01,0.7398784160614014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,8,power_law_1.01,0.35641601085662844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,8,balanced,0.283077339331309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,8,power_law_1.01,0.7665088176727295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,8,power_law_1.01,0.13808000087738037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,8,power_law_1.01,0.3347968101501465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,8,balanced,0.2863679925600688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,8,power_law_1.01,0.8769280433654785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,8,power_law_1.01,0.42259202003479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,8,power_law_1.01,0.20570878982543944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,8,balanced,0.29132266839345294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,8,balanced,0.9970133304595947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,8,power_law_1.01,0.41509761810302737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,8,power_law_1.01,0.9373824119567871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,8,power_law_1.01,0.09404799938201905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,8,balanced,0.29783467451731366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,8,power_law_1.01,0.533465576171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,8,power_law_1.01,1.1395135879516602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,8,power_law_1.01,0.13578879833221436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,8,power_law_1.01,0.6208640098571777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,8,power_law_1.01,1.478112030029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,8,power_law_1.01,0.1638975977897644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,8,power_law_1.01,0.7843008041381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,8,power_law_1.01,1.9070720672607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,8,power_law_1.01,0.8978303909301758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,8,power_law_1.01,0.22310400009155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,8,balanced,1.3385173479715984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,8,power_law_1.01,2.282156753540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,8,balanced,0.3068373401959737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,8,power_law_1.01,1.2187135696411133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,8,power_law_1.01,0.24339840412139893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,8,power_law_1.01,3.1954111099243163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,8,power_law_1.01,1.3941184043884278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,8,power_law_1.01,0.24184319972991944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,8,power_law_1.01,2.0786367416381837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,8,power_law_1.01,0.2627648115158081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,8,power_law_1.01,3.7836990356445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,8,power_law_1.01,0.26153600215911865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,8,power_law_1.01,2.6233600616455077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,8,power_law_1.01,4.991321563720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,8,balanced,0.3184906641642253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,8,power_law_1.01,0.2828736066818237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,8,power_law_1.01,3.4068225860595702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,8,power_law_1.01,0.3050431966781616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,8,power_law_1.01,8.578982543945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,8,balanced,1.7365226745605469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,8,power_law_1.01,4.9373119354248045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,8,power_law_1.01,0.3219327926635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,8,power_law_1.01,0.33710079193115233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,8,power_law_1.01,15.676634216308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,8,power_law_1.01,9.62551040649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,8,power_law_1.01,0.38800640106201173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,8,balanced,8.981930414835611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,8,balanced,0.3405493497848511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,8,power_law_1.01,0.37151360511779785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,8,balanced,0.3601013422012329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,8,power_law_1.01,0.38032639026641846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,8,balanced,2.0345333417256675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,8,power_law_1.2,0.2275264024734497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,8,power_law_1.01,0.42282881736755373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,8,power_law_1.2,0.13932160139083863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,8,power_law_1.01,0.48035202026367185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,8,balanced,0.4124373197555542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,8,power_law_1.2,0.14824960231781006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,8,power_law_1.2,0.23308799266815186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,8,power_law_1.01,0.5846528053283692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,8,power_law_1.2,0.26508800983428954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,8,balanced,0.45984001954396564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,8,power_law_1.2,0.41441922187805175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,8,power_law_1.01,0.752569580078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,8,power_law_1.2,0.4080639839172363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,8,power_law_1.2,0.45311360359191893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,8,power_law_1.01,0.9922623634338379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,8,balanced,0.696570634841919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,8,power_law_1.2,0.45638399124145507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,8,power_law_1.01,1.1208959579467774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,8,power_law_1.2,0.4746816158294678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,8,power_law_1.2,0.49170560836791993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,8,power_law_1.01,1.7300800323486327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,8,balanced,0.7916639645894369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,8,power_law_1.2,0.5072703838348389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,8,power_law_1.01,2.380121612548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,8,balanced,3.207749366760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,8,power_law_1.2,0.5315775871276855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,8,power_law_1.2,0.5768064022064209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,8,power_law_1.01,3.45797119140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,8,power_law_1.2,0.6304192066192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,8,balanced,1.143770694732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,8,power_law_1.01,4.244102478027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,8,power_law_1.2,0.7387263774871826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,8,power_law_1.2,0.1411967992782593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,8,power_law_1.2,0.6571392059326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,8,power_law_1.01,6.056121444702148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,8,power_law_1.2,0.07758079767227173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,8,power_law_1.2,0.8004608154296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,8,power_law_1.2,0.8348992347717286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,8,power_law_1.2,0.09423999786376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,8,power_law_1.01,9.036768341064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,8,power_law_1.2,0.9822208404541015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,8,power_law_1.2,0.1279039978981018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,8,balanced,1.5055893262227376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,8,power_law_1.2,1.0199040412902831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,8,power_law_1.2,0.15271040201187133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,8,power_law_1.2,1.3513983726501464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,8,power_law_1.01,18.703890991210937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,8,power_law_1.2,0.21101438999176025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,8,power_law_1.2,1.8535423278808594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,8,power_law_1.2,2.190809631347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,8,power_law_1.2,0.23623039722442626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,8,power_law_1.2,2.669203186035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,8,power_law_1.2,0.23963520526885987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,8,balanced,2.049488067626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,8,power_law_1.2,3.5609535217285155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,8,power_law_1.2,0.2552896022796631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,8,power_law_1.2,4.462195205688476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,8,power_law_1.2,0.26480000019073485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,8,power_law_1.2,0.27834880352020264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,8,power_law_1.2,7.7766845703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,8,power_law_1.2,0.28703999519348145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,8,power_law_1.2,11.74645767211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,8,power_law_1.2,0.30443520545959474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,8,power_law_1.2,0.31137919425964355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,8,power_law_1.2,0.33616640567779543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,8,balanced,2.748314539591471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,8,power_law_1.2,25.36290588378906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,8,power_law_1.2,0.3531008005142212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,8,power_law_1.2,0.3694400072097778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,8,power_law_1.2,0.4822591781616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,8,power_law_1.2,0.4508224010467529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,8,balanced,6.2821706136067705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,8,power_law_1.2,0.5859007835388184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,8,power_law_1.2,0.6686016082763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,8,power_law_1.2,0.8348223686218261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,8,power_law_1.2,1.080179214477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,8,balanced,3.288122812906901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,8,power_law_1.2,1.3555264472961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,8,power_law_1.2,1.8168960571289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,8,power_law_1.2,2.5456384658813476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,8,power_law_1.2,3.272480010986328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,8,power_law_1.2,4.005126571655273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,8,power_law_1.2,5.81187858581543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,8,power_law_1.2,14.364370727539063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,8,balanced,5.291221300760905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,4,balanced,0.05266666909058889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,4,balanced,0.06461333235104878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,4,balanced,0.06504533191521962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,4,balanced,0.08540266752243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,4,balanced,0.08947733044624329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,4,balanced,0.12378133336702983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,8,power_law_1.2,0.1385599970817566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,4,balanced,0.1379039982954661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,4,balanced,0.21996800104777017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,4,balanced,0.22237332661946616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,8,power_law_1.2,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,4,balanced,0.39128533999125165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,8,power_law_1.2,0.09616000056266785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,4,balanced,0.26632533470789593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,8,power_law_1.2,0.1186560034751892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,4,balanced,0.48811201254526776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,4,balanced,0.2701653242111206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,8,power_law_1.2,0.15118080377578735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,4,balanced,0.48789334297180176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,4,balanced,0.2722559968630473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,8,power_law_1.2,0.20534400939941405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,4,balanced,0.5001173416773478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,8,power_law_1.2,0.2395711898803711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,4,balanced,0.27171732981999713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,8,power_law_1.2,0.24451839923858643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,4,balanced,0.5013013283411661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,4,balanced,0.27641065915425617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,8,power_law_1.2,0.2679807901382446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,4,balanced,0.5030186573664347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,8,power_law_1.2,0.26384639739990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,4,balanced,0.2784000039100647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,8,balanced,10.616997400919596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,8,power_law_1.2,0.28901119232177735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,4,balanced,0.4984000126520793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,4,balanced,0.2808799942334493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,8,power_law_1.2,0.3058687925338745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,4,balanced,0.4972746769587199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,8,power_law_1.2,0.33043200969696046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,4,balanced,0.28194665908813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,4,balanced,0.5018666585286459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,8,power_law_1.2,0.36988799571990966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,4,balanced,0.29074132442474365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,8,power_law_1.2,0.3975487947463989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,4,balanced,0.508346676826477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,4,balanced,0.2961120009422302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,4,balanced,0.515936017036438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,4,balanced,0.3196106751759847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,8,power_law_1.2,0.3780224084854126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,4,balanced,0.5252853234608968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,4,balanced,0.31248533725738525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,4,balanced,0.5298186540603638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,4,balanced,0.3964960177739461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,8,power_law_1.2,0.3997951984405518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,4,balanced,0.5653333266576132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,4,balanced,0.34914131959279376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,4,balanced,0.5672053496042887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,4,balanced,0.5038400093714396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,8,power_law_1.2,0.4566336154937744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,8,power_law_1.2,0.5535103797912597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,4,balanced,0.8938079675038656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,4,balanced,0.43451201915740967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,4,balanced,0.648746649424235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,8,power_law_1.2,0.6371263980865478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,4,balanced,0.6616799831390381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,8,power_law_1.2,0.8766976356506347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,8,power_law_1.2,1.0562496185302734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,4,balanced,1.1498080094655354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,8,power_law_1.2,1.4384703636169434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,4,balanced,0.6350080172220866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,8,power_law_1.2,2.2673791885375976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,4,balanced,0.869914690653483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,8,power_law_1.2,2.5594688415527345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,4,balanced,0.056464001536369324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,8,power_law_1.2,3.5950592041015623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,4,balanced,0.06660800178845723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,4,balanced,1.0532533327738445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,8,power_law_1.2,5.983744049072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,4,balanced,0.0939573347568512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,4,balanced,0.137855996688207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,4,balanced,1.5348107020060222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,8,power_law_1.2,6.952275085449219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,4,balanced,0.22571200132369995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,4,balanced,0.27510400613149005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,8,power_law_1.2,11.880569458007812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,4,balanced,1.1651093165079753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,4,balanced,0.27774399518966675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,4,balanced,0.28111465771993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,4,balanced,1.5768639246622722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,4,balanced,0.2830880085627238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,8,power_law_1.2,26.518072509765624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,4,balanced,0.2857919931411743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,4,power_law_1.01,0.09619839787483216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,4,balanced,0.2889813383420308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,4,power_law_1.01,0.14268159866333008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,4,balanced,0.29266132911046344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,4,power_law_1.01,0.10828160047531128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,4,balanced,1.550869305928548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,4,balanced,0.29732799530029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,4,power_law_1.01,0.07885439991950989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,4,power_law_1.01,0.16320639848709106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,4,balanced,0.3057813247044881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,4,power_law_1.01,0.12910079956054688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,4,power_law_1.01,0.12791039943695068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,4,balanced,2.1027040481567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,4,power_law_1.01,0.15039360523223877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,4,balanced,0.31543999910354614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,4,power_law_1.01,0.17093759775161743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,4,power_law_1.01,0.22115840911865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,4,power_law_1.01,0.23342080116271974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,4,power_law_1.01,0.23155200481414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,4,power_law_1.01,0.38494720458984377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,4,power_law_1.01,0.23737599849700927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,4,power_law_1.01,0.40684800148010253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,4,power_law_1.01,0.24677760601043702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,4,balanced,0.3232799967130025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,4,power_law_1.01,0.4264959812164307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,4,balanced,2.0552426973978677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,4,power_law_1.01,0.24225280284881592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,4,power_law_1.01,0.4312895774841309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,4,power_law_1.01,0.26331520080566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,4,balanced,2.7122348149617515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,4,power_law_1.01,0.26547200679779054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,4,power_law_1.01,0.43240962028503416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,4,power_law_1.01,0.2836735963821411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,4,power_law_1.01,0.4615935802459717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,4,power_law_1.01,0.29028480052947997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,4,balanced,0.3410826524098714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,4,power_law_1.01,0.4634687900543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,4,power_law_1.01,0.31138560771942136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,4,power_law_1.01,0.48557438850402834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,4,power_law_1.01,0.3183232069015503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,4,power_law_1.01,0.4763775825500488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,4,power_law_1.01,0.33189759254455564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,4,power_law_1.01,0.5157631874084473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,4,power_law_1.01,0.41809921264648436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,4,balanced,2.4574294090270996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,4,power_law_1.01,0.5273600101470948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,4,power_law_1.01,0.43323521614074706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,4,power_law_1.01,0.5730175971984863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,4,power_law_1.01,0.525324821472168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,4,balanced,3.1510559717814126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,4,balanced,0.378165324529012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,4,power_law_1.01,0.5538432121276855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,4,power_law_1.01,0.6533631801605224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,4,power_law_1.01,0.7067967891693115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,4,power_law_1.01,0.6901311874389648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,4,balanced,0.41330134868621826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,4,power_law_1.01,0.9071167945861817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,4,power_law_1.01,0.8884032249450684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,4,power_law_1.01,1.1946368217468262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,4,power_law_1.01,0.9505215644836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,4,power_law_1.01,0.09653120040893555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,4,power_law_1.01,1.3180095672607421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,4,power_law_1.01,1.1399744033813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,4,balanced,0.5081066687901815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,4,power_law_1.01,0.09796479940414429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,4,power_law_1.01,1.3865407943725585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,4,power_law_1.01,1.7237503051757812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,4,power_law_1.01,0.08798080086708068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,4,balanced,0.5791360139846802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,4,power_law_1.01,1.7774272918701173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,4,power_law_1.01,2.612857627868652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,4,power_law_1.01,0.12007679939270019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,4,power_law_1.01,1.8823423385620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,4,power_law_1.01,3.096678352355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,4,power_law_1.01,0.15688960552215575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,4,balanced,0.8671893278757731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,4,power_law_1.01,2.8013248443603516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,4,power_law_1.01,0.22787199020385743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,4,power_law_1.01,4.754784011840821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,4,balanced,3.827258745829264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,4,power_law_1.01,0.23992319107055665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,4,power_law_1.01,3.6241214752197264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,4,balanced,1.0102346738179524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,4,power_law_1.01,0.24494719505310059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,4,power_law_1.01,9.34637451171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,4,power_law_1.01,0.25116159915924074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,4,power_law_1.01,4.935968017578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,4,balanced,5.041333198547363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,4,power_law_1.01,0.2717695951461792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,4,power_law_1.01,7.067635345458984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,4,power_law_1.01,0.2864448070526123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,4,balanced,1.4832266171773274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,4,power_law_1.01,0.30906240940093993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,4,power_law_1.01,0.32286078929901124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,4,power_law_1.01,13.820230102539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,4,power_law_1.01,0.35344638824462893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,4,balanced,1.9403039614359539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,4,power_law_1.01,0.38800640106201173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,4,power_law_1.01,0.38040320873260497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,4,balanced,2.679370562235514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,4,power_law_1.01,0.4020224094390869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,4,power_law_1.01,0.4493375778198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,4,power_law_1.01,0.5133312225341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,4,power_law_1.01,0.6244095802307129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,4,power_law_1.2,0.1423424005508423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,4,power_law_1.01,0.7374080181121826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,4,power_law_1.2,0.12040959596633911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,4,balanced,3.5763734181722007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,4,power_law_1.01,1.0104640007019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,4,power_law_1.2,0.1193727970123291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,4,power_law_1.01,1.2584704399108886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,4,power_law_1.2,0.19481600522994996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,4,power_law_1.01,1.840287971496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,4,power_law_1.2,0.2313215970993042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,4,power_law_1.01,2.489740753173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,4,power_law_1.2,0.3889856100082397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,4,balanced,7.539130528767903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,4,power_law_1.2,0.42420477867126466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,4,power_law_1.01,3.338092803955078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,4,power_law_1.2,0.4251904010772705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,4,power_law_1.01,4.178963088989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,4,balanced,9.856576283772787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,4,power_law_1.2,0.443449592590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,4,power_law_1.2,0.4585536003112793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,4,balanced,4.325589179992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,4,power_law_1.01,5.914879989624024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,4,power_law_1.2,0.4695551872253418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,4,power_law_1.01,8.879551696777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,4,power_law_1.2,0.5211008071899415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,4,power_law_1.2,0.5355584144592285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,4,power_law_1.01,17.629714965820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,4,power_law_1.2,0.4865664005279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,4,power_law_1.2,0.5257919788360595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,4,power_law_1.2,0.5581952095031738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,4,power_law_1.2,0.5996352195739746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,4,power_law_1.2,0.7211328029632569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,4,power_law_1.2,0.09063040018081665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,4,power_law_1.2,0.7539008140563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,4,power_law_1.2,0.06273919939994813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,4,power_law_1.2,0.08458880186080933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,4,power_law_1.2,0.9272768020629882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,4,power_law_1.2,0.10892159938812256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,4,balanced,6.933322906494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,4,power_law_1.2,0.13500159978866577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,4,power_law_1.2,1.0020095825195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,4,power_law_1.2,0.21464319229125978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,4,power_law_1.2,1.1698047637939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,4,power_law_1.2,0.23595519065856935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,4,power_law_1.2,0.23633279800415039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,4,power_law_1.2,1.5101311683654786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,4,power_law_1.2,0.24642560482025147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,4,power_law_1.2,1.8990207672119142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,4,power_law_1.2,0.24627199172973632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,4,power_law_1.2,0.26677119731903076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,4,power_law_1.2,2.2113216400146483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,4,power_law_1.2,0.2776704072952271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,4,power_law_1.2,3.36682243347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,4,power_law_1.2,0.28085761070251464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,4,power_law_1.2,0.2939903974533081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,4,power_law_1.2,4.078355026245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,4,power_law_1.2,0.31806719303131104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,4,power_law_1.2,0.33626880645751955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,4,power_law_1.2,5.197439956665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,4,power_law_1.2,0.35846400260925293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,4,power_law_1.2,0.42557439804077146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,4,power_law_1.2,0.4411263942718506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,4,power_law_1.2,8.664390563964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,4,power_law_1.2,0.5222911834716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,4,power_law_1.2,0.584339189529419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,4,power_law_1.2,15.857344055175782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,4,power_law_1.2,0.7894015789031983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,4,power_law_1.2,1.0399807929992675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,4,power_law_1.2,1.2733247756958008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,4,power_law_1.2,1.517311954498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,4,power_law_1.2,1.9658432006835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,4,power_law_1.2,2.6179584503173827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,4,power_law_1.2,3.3555839538574217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,4,power_law_1.2,5.73889274597168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,4,power_law_1.2,11.393824005126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,4,balanced,14.039658864339193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,4,power_law_1.2,0.10027519464492798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,4,power_law_1.2,0.08234239816665649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,4,power_law_1.2,0.08770560026168824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,4,power_law_1.2,0.12744959592819213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,4,power_law_1.2,0.15287040472030639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,2,balanced,0.0658133327960968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,4,power_law_1.2,0.22772479057312012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,2,balanced,0.08612799644470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,4,power_law_1.2,0.2398848056793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,2,balanced,0.12454400459925334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,4,power_law_1.2,0.2568831920623779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,2,balanced,0.22594666481018066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,2,balanced,0.3928906520207723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,4,power_law_1.2,0.26679039001464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,2,balanced,0.49039467175801593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,4,power_law_1.2,0.2786751985549927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,2,balanced,0.4924693504969279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,4,power_law_1.2,0.29966719150543214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,2,balanced,0.5144799947738647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,4,power_law_1.2,0.3153088092803955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,2,balanced,0.5216533342997233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,4,power_law_1.2,0.3335103988647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,2,balanced,0.5176000197728475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,4,power_law_1.2,0.3709503889083862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,2,balanced,0.506437341372172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,4,power_law_1.2,0.38253440856933596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,2,balanced,0.5130346616109213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,2,balanced,0.5139893293380737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,2,balanced,0.5199679931004842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,4,power_law_1.2,0.38525440692901614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,2,balanced,0.5327359835306803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,2,balanced,0.5347839991251627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,4,power_law_1.2,0.40833277702331544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,2,balanced,0.5496746699015299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,2,balanced,0.6528213421503702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,4,power_law_1.2,0.47318401336669924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,2,balanced,0.052709331115086876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,2,balanced,0.6102773348490397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,4,power_law_1.2,0.5908095836639404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,2,balanced,0.06599999964237213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,2,balanced,0.6986880302429199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,2,balanced,0.08943466345469157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,4,power_law_1.2,0.7127423763275147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,2,balanced,0.13917866349220276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,4,power_law_1.2,0.8134911537170411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,2,balanced,0.7094186941782633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,2,balanced,0.22421866655349731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,4,power_law_1.2,1.155622386932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,2,balanced,0.27220799525578815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,2,balanced,0.27742934226989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,4,power_law_1.2,1.3662783622741699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,2,balanced,1.0750400225321453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,2,power_law_1.01,0.0906175971031189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,2,balanced,0.276202658812205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,4,power_law_1.2,2.172876739501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,2,balanced,0.0698773314555486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,2,balanced,0.28004799286524457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,2,power_law_1.01,0.10996479988098144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,4,power_law_1.2,2.6848064422607423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,2,power_law_1.01,0.10839040279388427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,2,balanced,1.0390933354695637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,2,balanced,0.2825813293457031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,2,balanced,0.07577600081761678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,2,power_law_1.01,0.16960639953613282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,2,balanced,0.2888266642888387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,4,power_law_1.2,3.8005313873291016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,2,balanced,0.10257599751154582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,2,power_law_1.01,0.24586880207061768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,2,balanced,0.28915733098983765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,2,power_law_1.01,0.380511999130249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,2,balanced,0.14735466241836548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,4,power_law_1.2,5.857907104492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,2,balanced,0.29201600948969525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,2,power_law_1.01,0.4022655963897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,2,balanced,0.24288533131281534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,2,balanced,1.9496159553527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,2,power_law_1.01,0.416153621673584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,2,balanced,0.29660266637802124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,2,balanced,0.30355199178059894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,4,power_law_1.2,6.692467498779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,2,power_law_1.01,0.4236735820770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,2,balanced,0.29974399010340375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,2,power_law_1.01,0.4429823875427246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,2,balanced,0.31063467264175415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,2,balanced,0.3031839927037557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,2,power_law_1.01,0.4417088031768799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,2,balanced,0.31961599985758465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,4,power_law_1.2,10.329030609130859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,2,power_law_1.01,0.4827136039733887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,2,balanced,0.3063093423843384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,2,balanced,1.8669759432474773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,2,balanced,0.3344213167826335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,2,power_law_1.01,0.48427519798278806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,2,balanced,0.30796267588933307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,2,power_law_1.01,0.503436803817749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,2,balanced,0.31618666648864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,2,balanced,0.4548480113347371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,2,power_law_1.01,0.5457087993621826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,4,power_law_1.2,22.018605041503907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,2,balanced,0.3227733373641968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,2,power_law_1.01,0.5564415931701661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,2,balanced,0.3967466751734416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,2,balanced,0.32901867230733234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,2,power_law_1.01,0.6314176082611084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,2,power_law_1.01,0.7860352039337158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,2,balanced,0.34303466478983563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,2,balanced,0.47492798169453937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,2,power_law_1.01,0.7417471885681153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,2,balanced,0.3577013413111369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,2,power_law_1.01,0.9395135879516602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,2,balanced,2.482090632120768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,2,power_law_1.01,0.9121600151062011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,2,balanced,0.5107040007909139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,2,power_law_1.01,1.0982080459594727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,2,power_law_1.01,1.574009609222412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,2,balanced,0.7624266942342123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,2,power_law_1.01,2.0057472229003905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,2,balanced,0.3736000061035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,2,power_law_1.01,2.052332878112793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,2,power_law_1.01,2.8279232025146483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,2,power_law_1.01,0.06744959950447083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,2,balanced,0.8078880310058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,2,power_law_1.01,3.773561477661133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,2,power_law_1.01,0.0782144010066986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,2,balanced,0.40194133917490643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,2,balanced,3.276026725769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,2,power_law_1.01,0.07976959943771363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,2,power_law_1.01,4.74835205078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,2,power_law_1.01,0.11662080287933349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,2,power_law_1.01,7.823513793945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,2,balanced,1.2838986714680989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,2,power_law_1.01,0.13863680362701417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,2,power_law_1.01,0.21505279541015626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,2,power_law_1.01,13.661325073242187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,2,power_law_1.01,0.22449278831481934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,2,power_law_1.01,0.2445823907852173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,2,power_law_1.2,0.09041919708251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,2,power_law_1.01,0.24854400157928466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,2,balanced,0.4880319833755493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,2,balanced,1.469823996225993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,2,power_law_1.01,0.26074240207672117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,2,power_law_1.2,0.0714303970336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,2,balanced,0.5508426825205485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,2,power_law_1.01,0.2691328048706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,2,power_law_1.2,0.10717439651489258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,2,power_law_1.01,0.2817728042602539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,2,power_law_1.2,0.1510208010673523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,2,balanced,3.9090665181477866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,2,power_law_1.01,0.07982079982757569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,2,power_law_1.2,0.22023680210113525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,2,power_law_1.01,0.2893951892852783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,2,power_law_1.01,0.09418240189552307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,2,power_law_1.2,0.38075520992279055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,2,balanced,0.6961440245310465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,2,power_law_1.01,0.29582719802856444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,2,balanced,2.048389275868734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,2,power_law_1.01,0.09722880125045777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,2,power_law_1.2,0.39765760898590086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,2,power_law_1.01,0.3169536113739014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,2,power_law_1.01,0.12961280345916748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,2,power_law_1.2,0.41997442245483396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,2,balanced,0.8144959608713785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,2,power_law_1.01,0.33600640296936035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,2,power_law_1.01,0.1585536003112793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,2,power_law_1.2,0.44522881507873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,2,power_law_1.01,0.358022403717041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,2,power_law_1.01,0.23980801105499266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,2,power_law_1.2,0.44911999702453614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,2,balanced,1.2471413612365723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,2,power_law_1.01,0.43480958938598635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,2,power_law_1.01,0.25114879608154295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,2,power_law_1.01,0.26439039707183837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,2,power_law_1.2,0.4758143901824951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,2,power_law_1.01,0.4468736171722412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,2,power_law_1.01,0.27492480278015136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,2,power_law_1.2,0.4796095848083496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,2,power_law_1.01,0.5326720237731933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,2,power_law_1.01,0.28908159732818606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,2,balanced,1.500293254852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,2,balanced,2.6922826766967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,2,power_law_1.01,0.30935680866241455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,2,power_law_1.2,0.5034495830535889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,2,power_law_1.01,0.6167488098144531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,2,power_law_1.01,0.3360192060470581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,2,power_law_1.2,0.5176576137542724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,2,power_law_1.01,0.7923264026641845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,2,power_law_1.01,0.3460671901702881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,2,power_law_1.01,0.3941504001617432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,2,power_law_1.2,0.5577792167663574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,2,power_law_1.01,1.003993606567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,2,balanced,2.1751893361409507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,2,power_law_1.01,0.43546237945556643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,2,power_law_1.2,0.5864319801330566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,2,balanced,6.095263799031575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,2,power_law_1.01,1.2958080291748046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,2,power_law_1.2,0.664134407043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,2,power_law_1.01,0.4266240119934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,2,power_law_1.01,1.538323211669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,2,power_law_1.2,0.8252608299255371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,2,power_law_1.2,0.7964479923248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,2,power_law_1.01,2.2153663635253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,2,balanced,2.8619893391927085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,2,power_law_1.2,0.9140480041503907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,2,power_law_1.01,0.4593599796295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,2,power_law_1.01,2.901203155517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,2,power_law_1.2,0.9239104270935059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,2,balanced,3.2026240030924478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,2,power_law_1.01,3.463283157348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,2,power_law_1.2,1.184000015258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,2,power_law_1.01,0.546560001373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,2,power_law_1.2,1.689401626586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,2,power_law_1.01,0.6455808162689209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,2,power_law_1.01,5.853721618652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,2,power_law_1.2,2.1514816284179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,2,power_law_1.01,0.8187583923339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,2,balanced,4.037247975667317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,2,power_law_1.2,2.1161472320556642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,2,power_law_1.01,0.9787712097167969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,2,power_law_1.01,11.1089599609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,2,power_law_1.01,1.2895551681518556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,2,power_law_1.2,3.0462528228759767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,2,power_law_1.01,1.676633644104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,2,power_law_1.2,3.9740928649902343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,2,power_law_1.01,2.2715648651123046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,2,power_law_1.01,3.1949119567871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,2,power_law_1.2,5.260723114013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,2,power_law_1.01,4.407782363891601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,2,power_law_1.2,7.319417572021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,2,power_law_1.01,5.731647872924805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,2,balanced,5.417664210001628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,2,power_law_1.01,7.260063934326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,2,power_law_1.2,14.826042175292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,2,balanced,5.048538525899251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,2,power_law_1.01,11.317120361328126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,2,power_law_1.01,22.22926025390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,2,balanced,6.548309326171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,2,balanced,11.989471435546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,2,balanced,10.450799942016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,2,power_law_1.2,0.06700159907341004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,2,power_law_1.2,0.05989120006561279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,2,power_law_1.2,0.07747840285301208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,2,power_law_1.2,0.10229760408401489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,2,power_law_1.2,0.13723520040512086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,2,balanced,9.996074676513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,2,power_law_1.2,0.21953279972076417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,2,power_law_1.2,0.2335808038711548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,2,power_law_1.2,0.24134399890899658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,2,power_law_1.2,0.26099839210510256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,2,power_law_1.2,0.2637887954711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,2,power_law_1.2,0.27815680503845214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,2,power_law_1.2,0.2906431913375854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,2,power_law_1.2,0.30174078941345217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,2,power_law_1.2,0.3001983880996704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,2,power_law_1.2,0.314086389541626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,2,power_law_1.2,0.08124799728393554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,2,power_law_1.2,0.34010241031646726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,2,power_law_1.2,0.07551360130310059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,2,power_law_1.2,0.3746367931365967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,2,power_law_1.2,0.09251840114593506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,2,power_law_1.2,0.4410111904144287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,2,power_law_1.2,0.11360000371932984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,2,power_law_1.2,0.45656957626342776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,2,power_law_1.2,0.15115519762039184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,2,power_law_1.2,0.5681151866912841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,2,power_law_1.2,0.23795840740203858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,2,power_law_1.2,0.6617152214050293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,2,power_law_1.2,0.2583168029785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,2,balanced,20.932650248209637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,2,power_law_1.2,0.8308287620544433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,2,power_law_1.2,0.2733504056930542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,2,power_law_1.2,1.0477824211120605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,2,power_law_1.2,0.275711989402771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,2,power_law_1.2,1.4012736320495605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,2,power_law_1.2,0.2959808111190796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,2,power_law_1.2,1.6700799942016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,2,power_law_1.2,0.31535360813140867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,2,power_law_1.2,0.3407936096191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,2,power_law_1.2,2.291315269470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,2,power_law_1.2,0.3620287895202637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,2,power_law_1.2,2.9877695083618163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,2,power_law_1.2,0.3936064004898071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,2,power_law_1.2,3.6469566345214846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,2,power_law_1.2,0.4427775859832764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,2,power_law_1.2,6.4361213684082035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,2,power_law_1.2,0.4405695915222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,2,power_law_1.2,13.004185485839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,2,power_law_1.2,0.4691199779510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,1,balanced,0.06900266806284587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,2,power_law_1.2,0.5628608226776123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,1,balanced,0.08842133482297261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,2,power_law_1.2,0.6412415981292725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,1,balanced,0.1290826698144277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,1,balanced,0.23278933763504028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,1,balanced,0.4020479917526245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,2,power_law_1.2,0.8262144088745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,1,balanced,0.5094879865646362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,1,balanced,0.5103679895401001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,2,power_law_1.2,1.009267234802246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,1,balanced,0.5242986679077148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,1,balanced,0.5300693511962891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,2,power_law_1.2,1.4125951766967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,1,balanced,0.5325440168380737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,1,balanced,0.057029331723848976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,1,balanced,0.5270613431930542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,2,power_law_1.2,1.8587711334228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,1,balanced,0.07186133166154225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,1,balanced,0.5310399929682413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,1,balanced,0.09673600395520528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,1,balanced,0.5388586521148682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,2,power_law_1.2,2.636966323852539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,1,balanced,0.5539573431015015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,1,balanced,0.15568533539772034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,1,balanced,0.5726613203684489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,1,balanced,0.2579999963442485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,2,power_law_1.2,3.3933887481689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,1,balanced,0.30799466371536255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,1,balanced,0.5726240078608195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,1,balanced,0.3128160039583842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,2,power_law_1.2,4.438079833984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,1,balanced,0.5907626549402872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,1,balanced,0.3129333257675171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,1,balanced,0.7221120198567709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,2,power_law_1.2,7.006368255615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,1,balanced,0.32094399134318036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,1,balanced,0.6917973359425863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,1,balanced,0.3226720094680786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,1,balanced,0.7938186327616373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,2,power_law_1.2,8.089702606201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,1,power_law_1.01,0.06704000234603882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,1,balanced,0.32860267162323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,1,balanced,0.8641706307729086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,1,balanced,0.33559465408325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,1,power_law_1.01,0.0819263994693756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,2,power_law_1.2,13.022918701171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,1,balanced,0.3399893442789714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,1,power_law_1.01,0.1065600037574768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,1,balanced,1.3149066766103108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,1,balanced,0.35630400975545246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,1,power_law_1.01,0.17717119455337524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,1,power_law_1.01,0.23041279315948487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,1,balanced,0.367578665415446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,2,power_law_1.2,26.47541198730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,1,balanced,1.3643199602762859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,1,power_law_1.01,0.3878400087356567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,1,balanced,0.37827201684316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,1,balanced,0.09853333234786987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,1,power_law_1.01,0.4058432102203369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,1,balanced,0.3996373414993286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,1,balanced,2.426959991455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,1,power_law_1.01,0.4309823989868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,1,balanced,0.10292266805966695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,1,balanced,0.5387359857559204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,1,balanced,0.12678933143615723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,1,power_law_1.01,0.4419136047363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,1,balanced,0.5042293469111124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,1,balanced,0.1807466745376587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,1,power_law_1.01,0.4424767971038818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,1,power_law_1.01,0.46826882362365724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,1,balanced,0.2741973400115967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,1,balanced,0.668405294418335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,1,balanced,2.5284533500671387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,1,balanced,0.3359200159708659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,1,power_law_1.01,0.4858240127563477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,1,balanced,0.6722506682078043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,1,balanced,0.3401706616083781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,1,power_law_1.01,0.5203711986541748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,1,balanced,0.3487519820531209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,1,power_law_1.01,0.5635007858276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,1,balanced,1.0034826596577961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,1,balanced,0.3535733222961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,1,power_law_1.01,0.5940351963043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,1,balanced,0.36113067468007404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,1,power_law_1.01,0.6099775791168213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,1,balanced,4.322490692138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,1,balanced,0.37027732531229657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,1,power_law_1.01,0.6480447769165039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,1,balanced,1.1268853346506755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,1,balanced,0.38712533315022785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,1,power_law_1.01,0.759225606918335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,1,balanced,0.39907201131184894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,1,power_law_1.01,0.7614143848419189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,1,power_law_1.01,0.05264000296592712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,1,balanced,0.42107200622558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,1,power_law_1.01,0.8969663619995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,1,balanced,1.7992107073465984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,1,power_law_1.01,0.0669376015663147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,1,balanced,0.4530293146769206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,1,power_law_1.01,1.0095680236816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,1,power_law_1.01,0.08470399975776673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,1,power_law_1.01,1.2454015731811523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,1,balanced,4.921653429667155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,1,power_law_1.01,0.12407679557800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,1,power_law_1.01,1.8420352935791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,1,power_law_1.01,0.15406719446182252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,1,balanced,2.1399733225504556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,1,power_law_1.01,2.3603647232055662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,1,balanced,0.5046773354212443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,1,power_law_1.01,0.24080638885498046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,1,power_law_1.01,3.1660287857055662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,1,power_law_1.01,0.25724799633026124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,1,power_law_1.01,0.2683135986328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,1,power_law_1.01,4.184774398803711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,1,power_law_1.01,0.28291199207305906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,1,power_law_1.01,4.906572723388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,1,balanced,0.5633546511332194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,1,power_law_1.01,0.2921087980270386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,1,balanced,3.1566880544026694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,1,power_law_1.01,6.151174545288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,1,power_law_1.01,0.31198079586029054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,1,balanced,5.595151901245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,1,power_law_1.01,0.3272639989852905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,1,power_law_1.01,9.487232208251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,1,power_law_1.01,0.3532160043716431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,1,power_law_1.01,0.3440063953399658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,1,power_law_1.01,0.37455999851226807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,1,balanced,0.7251733144124349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,1,power_law_1.01,18.63360595703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,1,power_law_1.01,0.38443520069122317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,1,balanced,0.8399946689605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,1,power_law_1.01,0.4320000171661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,1,balanced,4.072880109151204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,1,power_law_1.01,0.5137856006622314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,1,balanced,1.1023733615875244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,1,power_law_1.01,0.5575424194335937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,1,power_law_1.01,0.6894336223602295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,1,balanced,1.3275360266367595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,1,power_law_1.01,0.7567103862762451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,1,balanced,1.9963679313659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,1,power_law_1.01,0.9924863815307617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,1,power_law_1.01,0.08837119936943054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,1,power_law_1.01,1.3446080207824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,1,balanced,8.731541315714518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,1,power_law_1.01,0.09893119931221009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,1,power_law_1.01,1.807935905456543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,1,balanced,2.46724271774292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,1,balanced,4.701007843017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,1,power_law_1.01,0.11191040277481079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,1,power_law_1.01,2.2096895217895507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,1,power_law_1.01,0.14902399778366088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,1,power_law_1.01,3.123142433166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,1,power_law_1.01,0.18443520069122316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,1,balanced,3.6046826044718423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,1,power_law_1.01,0.2715456008911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,1,power_law_1.01,4.2195392608642575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,1,power_law_1.01,0.2916287899017334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,1,power_law_1.01,5.115910339355469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,1,power_law_1.01,0.2981760025024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,1,power_law_1.01,0.316646409034729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,1,power_law_1.01,7.781676483154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,1,power_law_1.01,0.3353087902069092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,1,balanced,4.729983965555827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,1,power_law_1.2,0.06673920154571533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,1,power_law_1.01,0.35735039710998534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,1,power_law_1.2,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,1,power_law_1.01,0.39178879261016847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,1,power_law_1.01,16.139846801757812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,1,power_law_1.2,0.09975680112838745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,1,power_law_1.01,0.4183807849884033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,1,power_law_1.2,0.15650559663772584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,1,power_law_1.01,0.4668288230895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,1,power_law_1.2,0.21595520973205568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,1,power_law_1.2,0.37674241065979003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,1,power_law_1.01,0.5132415771484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,1,power_law_1.2,0.40111360549926756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,1,balanced,7.560480117797852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,1,balanced,6.747338612874349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,1,power_law_1.2,0.4297152042388916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,1,power_law_1.2,0.4426432132720947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,1,power_law_1.01,0.543071985244751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,1,power_law_1.2,0.4561215877532959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,1,power_law_1.2,0.4832064151763916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,1,power_law_1.2,0.5138239860534668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,1,power_law_1.2,0.53023362159729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,1,power_law_1.01,0.6150271892547607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,1,power_law_1.2,0.5764544010162354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,1,power_law_1.2,0.61080322265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,1,power_law_1.2,0.6286911964416504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,1,power_law_1.01,0.7470719814300537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,1,power_law_1.2,0.6521535873413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,1,balanced,9.070383707682291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,1,power_law_1.01,0.8842495918273926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,1,power_law_1.2,0.7729152202606201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,1,power_law_1.2,0.773203182220459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,1,power_law_1.01,1.1467583656311036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,1,power_law_1.2,0.8993791580200196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,1,balanced,17.130874633789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,1,power_law_1.01,1.4090368270874023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,1,power_law_1.2,1.0312447547912598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,1,power_law_1.01,1.9261632919311524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,1,power_law_1.2,1.3271488189697265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,1,power_law_1.01,2.4655040740966796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,1,power_law_1.2,1.8893375396728516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,1,power_law_1.01,3.5418624877929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,1,power_law_1.2,2.4488384246826174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,1,power_law_1.01,4.614585494995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,1,power_law_1.2,3.2657726287841795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,1,power_law_1.2,0.054790401458740236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,1,power_law_1.01,6.769741058349609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,1,balanced,11.054453531901041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,1,power_law_1.2,4.246912002563477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,1,power_law_1.2,0.06275839805603027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,1,power_law_1.2,5.193958282470703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,1,power_law_1.01,8.901382446289062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,1,power_law_1.2,0.08329600095748901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,1,power_law_1.2,0.11185280084609986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,1,power_law_1.2,6.335103988647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,1,power_law_1.2,0.145305597782135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,1,power_law_1.01,11.042963409423828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,1,power_law_1.2,0.2408895969390869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,1,power_law_1.2,9.597325134277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,1,power_law_1.2,0.2575103998184204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,1,power_law_1.01,17.4666748046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,1,power_law_1.2,0.2747711896896362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,1,power_law_1.2,0.2915519952774048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,1,power_law_1.2,18.55986633300781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,1,balanced,14.968315124511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,1,power_law_1.2,0.30437119007110597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,1,power_law_1.2,0.3221823930740356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,1,power_law_1.01,34.64625854492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,1,power_law_1.2,0.3392832040786743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,1,power_law_1.2,0.3497215986251831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,1,power_law_1.2,0.357856011390686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,1,power_law_1.2,0.3766527891159058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,1,balanced,17.786725362141926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,1,power_law_1.2,0.3891968011856079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,1,power_law_1.2,0.43856000900268555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,1,power_law_1.2,0.5178688049316407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,1,power_law_1.2,0.5703743934631348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,1,power_law_1.2,0.6969344139099121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,1,power_law_1.2,0.774073600769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,1,power_law_1.2,1.0188672065734863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,1,power_law_1.2,1.3671615600585938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,1,power_law_1.2,1.8334272384643555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,1,power_law_1.2,2.2371904373168947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,1,power_law_1.2,3.1942975997924803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,1,power_law_1.2,4.2431999206542965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,1,power_law_1.2,5.299724960327149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,1,power_law_1.2,8.008448028564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,1,power_law_1.2,16.046380615234376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,1,power_law_1.2,0.08822399973869324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,1,balanced,35.27886454264323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,1,power_law_1.2,0.09895039796829223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,1,power_law_1.2,0.10820480585098266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,1,power_law_1.2,0.13985919952392578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,1,power_law_1.2,0.170905601978302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,1,power_law_1.2,0.2636607885360718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,1,power_law_1.2,0.2884799957275391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,1,power_law_1.2,0.30422399044036863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,1,power_law_1.2,0.32488958835601806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,8,balanced,0.07046933472156525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,1,power_law_1.2,0.34279038906097414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,8,balanced,0.08201066652933757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,1,power_law_1.2,0.37226879596710205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,8,balanced,0.12156800429026286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,1,power_law_1.2,0.39655680656433107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,8,balanced,0.20587199926376343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,1,power_law_1.2,0.4272575855255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,8,balanced,0.37459198633829754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,1,power_law_1.2,0.46908159255981446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,8,balanced,0.7001653512318929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,1,power_law_1.2,0.5293632030487061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,8,balanced,1.0250720183054607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,8,balanced,1.0248106320699055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,1,power_law_1.2,0.5565311908721924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,8,balanced,1.0192533334096272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,8,balanced,1.0269386768341064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,8,balanced,1.0426080226898193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,1,power_law_1.2,0.6307328224182129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,8,balanced,1.0463306903839111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,8,balanced,1.0311946868896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,1,power_law_1.2,0.7501760005950928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,8,balanced,1.0392533143361409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,1,power_law_1.2,0.8841152191162109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,8,balanced,1.0326293309529622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,1,power_law_1.2,1.1582079887390138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,8,balanced,1.0392106374104817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,1,power_law_1.2,1.41146879196167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,8,balanced,1.0490453243255615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,1,power_law_1.2,1.943552017211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,8,balanced,1.06605863571167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,1,power_law_1.2,2.4888383865356447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,8,balanced,0.05558399856090546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,8,balanced,1.101802666982015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,1,power_law_1.2,3.558553695678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,8,balanced,0.06321600079536438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,8,balanced,1.1424799760182698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,8,balanced,0.08275199929873149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,1,power_law_1.2,4.620748901367188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,8,balanced,0.1293333371480306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,1,power_law_1.2,6.771443176269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,8,balanced,1.1666560173034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,8,balanced,0.20975999037424722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,8,balanced,0.3778293530146281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,1,power_law_1.2,8.88817901611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,8,balanced,0.5453973213831583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,8,balanced,1.2268373171488445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,8,balanced,0.5331893364588419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,1,power_law_1.2,11.018201446533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,8,balanced,0.5345226526260376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,8,balanced,0.5350346565246582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,8,balanced,1.3012906710306804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,8,balanced,0.5416693290074667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,1,power_law_1.2,17.430950927734376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,8,balanced,0.5449173450469971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,8,balanced,0.5495200157165527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,8,balanced,0.5526826779047648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,8,balanced,1.3986560503641765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,1,power_law_1.2,34.61930847167969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,8,balanced,0.561029314994812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,8,balanced,0.057349334160486855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,8,balanced,0.5662613312403361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,8,balanced,0.06651733318964641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,8,balanced,0.5768320163091024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,8,power_law_1.01,0.20042240619659424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,8,power_law_1.01,0.133024001121521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,8,balanced,1.760650634765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,8,balanced,0.09084799885749817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,8,balanced,0.5958453416824341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,8,power_law_1.01,0.3635008096694946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,8,balanced,0.13964800039927164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,8,power_law_1.01,0.20139520168304442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,8,power_law_1.01,0.6791872024536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,8,balanced,0.6133653322855631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,8,balanced,0.21802133321762085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,8,power_law_1.01,0.3652928113937378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,8,balanced,0.37595200538635254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,8,power_law_1.01,0.19697920083999634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,8,balanced,0.6492906808853149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,8,power_law_1.01,0.1337407946586609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,8,balanced,0.5393600066502889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,8,power_law_1.01,0.30969600677490233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,8,power_law_1.01,0.16967040300369263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,8,balanced,0.5391733249028524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,8,balanced,0.6828587055206299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,8,power_law_1.01,0.5121984004974365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,8,balanced,1.9336907068888347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,8,power_law_1.01,0.27917439937591554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,8,balanced,0.5405439933141073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,8,power_law_1.01,0.5400447845458984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,8,balanced,0.5436906814575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,8,balanced,0.7451679706573486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,8,power_law_1.01,0.310860800743103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,8,power_law_1.01,0.7099391937255859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,8,balanced,0.5452693303426107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,8,power_law_1.01,0.3566848039627075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,8,power_law_1.01,0.7084288120269775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,8,balanced,0.5496160189310709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,8,power_law_1.01,0.382207989692688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,8,balanced,0.8255946636199951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,8,power_law_1.01,0.7302720069885253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,8,balanced,0.550927996635437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,8,power_law_1.01,0.3866175889968872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,8,power_law_1.01,0.7902527809143066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,8,balanced,0.5552213191986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,8,power_law_1.01,0.4005760192871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,8,balanced,0.5660853385925293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,8,power_law_1.01,0.8586496353149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,8,balanced,2.678442637125651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,8,balanced,0.9425280094146729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,8,power_law_1.01,0.4508096218109131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,8,balanced,0.5712159872055054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,8,power_law_1.01,0.7895872116088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,8,power_law_1.01,0.43551998138427733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,8,balanced,0.5856800079345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,8,power_law_1.01,0.8783424377441407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,8,power_law_1.01,0.46528639793396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,8,balanced,0.6127573251724243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,8,power_law_1.01,0.884768009185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,8,power_law_1.01,0.5172095775604248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,8,power_law_1.01,0.8941632270812988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,8,balanced,1.2096266746520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,8,power_law_1.01,0.5139135837554931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,8,power_law_1.01,0.9553728103637695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,8,power_law_1.01,0.516044807434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,8,power_law_1.01,1.038707160949707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,8,balanced,0.6373546520868937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,8,power_law_1.01,0.585811185836792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,8,power_law_1.01,1.216108798980713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,8,balanced,3.401119867960612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,8,power_law_1.01,0.6541312217712403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,8,power_law_1.01,1.6075519561767577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,8,power_law_1.01,0.7375423908233643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,8,balanced,1.4483946164449055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,8,power_law_1.01,1.4355199813842774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,8,power_law_1.01,0.8049216270446777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,8,power_law_1.01,1.7559999465942382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,8,power_law_1.2,0.22275838851928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,8,power_law_1.01,0.937228775024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,8,power_law_1.01,1.5571840286254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,8,power_law_1.2,0.36246399879455565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,8,power_law_1.01,1.039795207977295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,8,balanced,0.6982346375783285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,8,power_law_1.01,2.074227142333984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,8,power_law_1.01,0.14048000574111938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,8,power_law_1.2,0.27489280700683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,8,power_law_1.01,1.2996735572814941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,8,power_law_1.01,2.5472063064575194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,8,power_law_1.01,0.22109439373016357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,8,power_law_1.2,0.20067839622497557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,8,balanced,0.7550933361053467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,8,power_law_1.01,1.694380760192871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,8,power_law_1.01,0.3843071937561035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,8,power_law_1.2,0.30692479610443113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,8,power_law_1.01,3.3466560363769533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,8,power_law_1.01,0.14810240268707275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,8,balanced,1.9751092592875164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,8,power_law_1.01,2.165439987182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,8,power_law_1.2,0.41768321990966795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,8,balanced,0.8621333440144857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,8,power_law_1.01,0.19541759490966798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,8,power_law_1.01,3.7033409118652343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,8,power_law_1.01,0.28103039264678953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,8,power_law_1.01,2.4510847091674806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,8,power_law_1.2,0.4788224220275879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,8,power_law_1.01,0.2997312068939209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,8,power_law_1.01,4.775411224365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,8,power_law_1.2,0.6892608165740967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,8,balanced,1.0256000359853108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,8,power_law_1.01,0.38296959400177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,8,power_law_1.01,3.1155263900756838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,8,balanced,5.08784548441569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,8,power_law_1.2,0.6921216011047363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,8,power_law_1.01,0.42446079254150393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,8,power_law_1.01,7.072038269042968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,8,power_law_1.01,0.40758399963378905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,8,power_law_1.01,4.939238357543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,8,power_law_1.2,0.7177343845367432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,8,power_law_1.01,0.42968320846557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,8,power_law_1.2,0.7700352191925048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,8,balanced,1.2125813166300456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,8,power_law_1.01,0.4401855945587158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,8,power_law_1.01,12.76192626953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,8,power_law_1.01,9.354303741455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,8,power_law_1.2,0.8227007865905762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,8,power_law_1.01,0.4726912021636963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,8,power_law_1.01,0.5096255779266358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,8,power_law_1.2,0.8463871955871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,8,balanced,2.5305867195129395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,8,power_law_1.01,0.5362688064575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,8,power_law_1.2,0.8203007698059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,8,power_law_1.01,0.5588672161102295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,8,balanced,1.7717547416687012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,8,power_law_1.01,0.6615295886993409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,8,power_law_1.2,0.9248512268066407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,8,power_law_1.01,0.7669248104095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,8,power_law_1.2,0.888377571105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,8,power_law_1.2,0.9710463523864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,8,power_law_1.01,0.7716415882110595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,8,power_law_1.2,1.146406364440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,8,power_law_1.2,1.2648768424987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,8,balanced,2.1660106976826987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,8,power_law_1.01,0.7901951789855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,8,power_law_1.2,1.6830848693847655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,8,power_law_1.01,0.9201984405517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,8,power_law_1.2,1.4919936180114746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,8,power_law_1.01,1.2217087745666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,8,power_law_1.01,1.3204607963562012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,8,power_law_1.2,1.9079679489135741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,8,power_law_1.01,1.7957696914672852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,8,power_law_1.2,1.7345792770385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,8,power_law_1.01,2.2275968551635743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,8,balanced,3.7268425623575845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,8,power_law_1.2,2.2579072952270507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,8,power_law_1.01,3.155276870727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,8,balanced,3.0052267710367837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,8,power_law_1.2,2.9748735427856445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,8,power_law_1.01,4.135200119018554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,8,power_law_1.2,3.985996627807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,8,power_law_1.01,5.315545654296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,8,power_law_1.2,4.792524719238282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,8,power_law_1.01,7.762687683105469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,8,power_law_1.2,5.220582580566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,8,balanced,9.366154352823893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,8,power_law_1.01,16.09032287597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,8,power_law_1.2,8.911622619628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,8,balanced,3.8552160263061523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,8,power_law_1.2,15.90497283935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,8,power_law_1.2,0.13327360153198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,8,power_law_1.2,0.2021951913833618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,8,power_law_1.2,0.22062718868255615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,8,power_law_1.2,0.12711039781570435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,8,power_law_1.2,0.17292159795761108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,8,power_law_1.2,0.2356800079345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,8,power_law_1.2,0.28549120426177976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,8,balanced,5.965866724650065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,8,power_law_1.2,0.3431616067886353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,8,power_law_1.2,0.38385920524597167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,8,balanced,7.005930582682292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,8,power_law_1.2,0.38073599338531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,8,power_law_1.2,0.4102719783782959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,8,power_law_1.2,0.42999677658081054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,8,power_law_1.2,0.4118080139160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,8,power_law_1.2,0.4810880184173584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,8,power_law_1.2,0.4918079853057861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,8,power_law_1.2,0.5498559951782227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,8,power_law_1.2,0.5146368026733399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,8,power_law_1.2,0.550707197189331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,8,power_law_1.2,0.6817279815673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,8,power_law_1.2,0.7987391948699951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,8,power_law_1.2,0.8881983757019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,8,power_law_1.2,1.0410112380981444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,8,power_law_1.2,1.0515456199645996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,8,power_law_1.2,1.3675456047058105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,8,power_law_1.2,1.7824064254760743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,8,power_law_1.2,2.5344703674316404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,8,power_law_1.2,3.072774314880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,8,balanced,11.698874155680338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,8,power_law_1.2,3.4468673706054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,8,power_law_1.2,5.683852767944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,8,power_law_1.2,11.261650848388673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,4,balanced,0.06755200028419495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,4,balanced,0.08336533109347026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,4,balanced,0.12141866485277812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,4,balanced,0.20946667591730753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,8,power_law_1.2,0.13853440284729004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,4,balanced,0.3705973227818807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,4,balanced,0.6906507015228271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,8,power_law_1.2,0.22036480903625488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,4,balanced,1.0141173203786213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,8,power_law_1.2,0.18252160549163818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,4,balanced,1.021621306737264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,8,power_law_1.2,0.14012160301208496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,4,balanced,1.02238933245341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,8,power_law_1.2,0.19247360229492189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,4,balanced,1.0301012992858887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,4,balanced,1.0191360314687092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,8,power_law_1.2,0.2544447898864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,4,balanced,1.0293280283610027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,8,power_law_1.2,0.2796607971191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,4,balanced,1.0381120045979817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,8,power_law_1.2,0.37969279289245605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,4,balanced,1.0323839982350667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,8,power_law_1.2,0.3949376106262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,4,balanced,1.0409973462422688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,8,power_law_1.2,0.3926527976989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,4,balanced,1.0491893291473389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,8,power_law_1.2,0.41608319282531736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,4,balanced,1.057744026184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,8,power_law_1.2,0.4810944080352783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,4,balanced,1.0850666364034016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,8,power_law_1.2,0.4516928195953369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,4,balanced,1.1182400385538738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,8,power_law_1.2,0.5128448009490967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,4,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,4,balanced,1.1602400143941243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,8,power_law_1.2,0.5489535808563233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,4,balanced,0.06403733293215434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,4,balanced,0.0841919978459676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,8,power_law_1.2,0.6154304027557373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,4,balanced,1.2035253047943115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,4,balanced,0.12971733013788858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,4,balanced,0.2099626660346985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,8,power_law_1.2,0.6626431941986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,4,balanced,0.3730400005976359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,8,power_law_1.2,0.7887872219085693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,4,balanced,0.5402826468149821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,4,balanced,1.2779200077056885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,4,balanced,0.5390026569366455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,4,power_law_1.01,0.13133440017700196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,4,balanced,0.5413386821746826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,4,balanced,0.5409813324610392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,4,power_law_1.01,0.20044159889221191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,8,power_law_1.2,0.828831958770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,4,balanced,1.384698708852132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,4,balanced,0.5522986650466919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,4,balanced,0.5542933146158854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,4,power_law_1.01,0.36382720470428465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,4,balanced,0.07144000132878621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,4,balanced,0.5598826805750529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,4,power_law_1.01,0.1822208046913147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,4,balanced,0.5647626717885336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,8,power_law_1.2,0.8502655982971191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,4,balanced,0.0795306662718455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,4,power_law_1.01,0.30023040771484377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,4,balanced,0.5724426507949829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,4,balanced,1.5227519671122234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,8,power_law_1.2,1.0309120178222657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,4,balanced,0.09650133053461711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,4,balanced,0.5852320194244385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,4,power_law_1.01,0.45078401565551757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,4,balanced,0.5969653526941935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,4,balanced,0.14800533652305603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,8,power_law_1.2,1.3078144073486329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,4,power_law_1.01,0.5162559986114502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,4,balanced,0.22535467147827148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,4,balanced,0.6122773488362631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,8,power_law_1.2,1.488755226135254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,4,power_law_1.01,0.7085631847381592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,4,balanced,0.38333332538604736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,4,balanced,0.6315733194351196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,4,balanced,1.8991200129191081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,8,power_law_1.2,2.040947151184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,4,power_law_1.01,0.740390396118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,4,balanced,0.5495680173238119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,4,balanced,0.6791573365529379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,4,balanced,0.5516000191370646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,4,power_law_1.01,0.7177984237670898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,8,power_law_1.2,2.616070365905762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,4,balanced,0.7368533611297607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,4,balanced,0.5521066586176554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,4,power_law_1.01,0.7545407772064209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,8,power_law_1.2,3.636217498779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,4,balanced,0.5555413166681925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,4,power_law_1.01,0.7893119812011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,4,balanced,0.8173333009084066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,4,balanced,0.5584959983825684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,8,power_law_1.2,4.8030143737792965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,4,power_law_1.01,0.8114239692687988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,4,balanced,2.1803733507792153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,4,balanced,0.5664426485697428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,4,power_law_1.01,0.0870527982711792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,4,balanced,0.9124639828999838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,8,power_law_1.2,6.215539169311524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,4,power_law_1.01,0.852511978149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,4,balanced,0.5695679982503256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,4,power_law_1.01,0.12281600236892701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,4,power_law_1.01,0.8828543663024903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,4,balanced,0.581216017405192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,8,power_law_1.2,10.501824188232423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,4,power_law_1.01,0.2056960105895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,4,power_law_1.01,0.8908479690551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,4,balanced,1.0853599707285564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,4,balanced,0.5960426727930704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,4,power_law_1.01,0.11619199514389038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,4,power_law_1.01,0.9285056114196777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,4,balanced,0.604640007019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,4,power_law_1.01,0.17002880573272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,8,power_law_1.2,19.174496459960938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,4,power_law_1.01,1.0562432289123536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,4,balanced,0.6216479937235514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,4,power_law_1.01,0.2599616050720215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,4,power_law_1.01,1.16310396194458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,4,balanced,3.0074294408162436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,4,balanced,1.3887252807617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,4,balanced,0.6606026490529379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,4,power_law_1.01,0.2890559911727905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,4,power_law_1.01,1.3229248046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,4,power_law_1.01,0.3714560031890869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,4,power_law_1.01,1.4186944007873534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,4,power_law_1.01,0.3916032075881958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,4,power_law_1.01,1.7871936798095702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,4,power_law_1.01,0.39213440418243406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,4,balanced,0.7249279816945394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,4,power_law_1.01,1.5960384368896485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,4,balanced,1.7176906267801921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,4,power_law_1.01,0.40416641235351564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,4,power_law_1.01,1.8660160064697267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,4,power_law_1.01,0.4246335983276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,4,power_law_1.01,2.4479743957519533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,4,balanced,3.9656960169474282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,4,power_law_1.01,0.4334911823272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,4,power_law_1.01,3.352159881591797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,4,power_law_1.01,0.4675456047058105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,4,power_law_1.01,3.9422401428222655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,4,power_law_1.01,0.4809279918670654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,4,balanced,0.8283786773681641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,4,balanced,2.320064067840576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,4,power_law_1.01,4.7280830383300785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,4,power_law_1.01,0.5255104064941406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,4,power_law_1.01,0.519046401977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,4,balanced,0.91212264696757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,4,power_law_1.01,0.5939648151397705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,4,power_law_1.01,7.217491149902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,4,power_law_1.01,0.10941439867019653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,4,power_law_1.01,0.6640128135681153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,4,balanced,1.052016019821167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,4,power_law_1.01,0.7801407814025879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,4,power_law_1.01,0.14803839921951295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,4,power_law_1.01,14.750643920898437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,4,power_law_1.01,0.8047807693481446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,4,power_law_1.01,0.23028481006622314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,4,balanced,1.3026026884714763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,4,power_law_1.01,0.9769151687622071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,4,power_law_1.01,0.13137919902801515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,4,balanced,2.9389120737711587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,4,power_law_1.01,1.021350383758545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,4,power_law_1.01,0.20161919593811034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,4,power_law_1.2,0.13065600395202637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,4,balanced,5.610191980997722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,4,power_law_1.01,1.2825599670410157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,4,power_law_1.01,0.2575040102005005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,4,balanced,1.6119146347045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,4,power_law_1.2,0.19955840110778808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,4,power_law_1.01,1.699033546447754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,4,power_law_1.01,0.3035007953643799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,4,power_law_1.2,0.20677759647369384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,4,power_law_1.01,2.2902719497680666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,4,power_law_1.01,0.37569279670715333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,4,power_law_1.2,0.19033600091934205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,4,power_law_1.01,0.3910399913787842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,4,power_law_1.01,2.7123392105102537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,4,balanced,2.362191994984945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,4,power_law_1.2,0.2756671905517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,4,power_law_1.01,0.42057600021362307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,4,power_law_1.01,3.3847808837890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,4,power_law_1.2,0.379584002494812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,4,power_law_1.01,0.4264512062072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,4,power_law_1.2,0.48657917976379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,4,power_law_1.01,4.9869953155517575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,4,power_law_1.01,0.4564223766326904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,4,power_law_1.2,0.6525440216064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,4,power_law_1.01,0.4531712055206299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,4,power_law_1.2,0.6752255916595459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,4,power_law_1.01,9.913037109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,4,balanced,2.9741493860880532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,4,power_law_1.01,0.5172927856445313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,4,balanced,4.415984153747559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,4,power_law_1.2,0.7072319984436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,4,power_law_1.01,0.5447296142578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,4,power_law_1.2,0.7503232002258301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,4,power_law_1.01,0.5996799945831299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,4,power_law_1.2,0.7558271884918213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,4,power_law_1.01,0.6667456150054931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,4,power_law_1.2,0.7840191841125488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,4,power_law_1.01,0.7818943977355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,4,power_law_1.2,0.8373824119567871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,4,balanced,4.120138804117839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,4,power_law_1.2,0.8772224426269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,4,power_law_1.01,0.8289343833923339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,4,power_law_1.2,0.8908415794372558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,4,power_law_1.2,0.9957119941711425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,4,power_law_1.01,0.9159616470336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,4,power_law_1.2,1.1305919647216798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,4,power_law_1.01,1.0534720420837402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,4,power_law_1.2,1.2052160263061524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,4,power_law_1.01,1.355782413482666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,4,balanced,10.519925435384115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,4,power_law_1.2,1.4098112106323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,4,power_law_1.01,1.5308416366577149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,4,power_law_1.2,1.5250432014465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,4,balanced,5.2473494211832685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,4,power_law_1.01,2.0963199615478514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,4,power_law_1.2,1.9882495880126954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,4,power_law_1.01,2.6703168869018556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,4,power_law_1.2,1.649977684020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,4,power_law_1.01,3.826425552368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,4,power_law_1.2,2.0457151412963865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,4,power_law_1.01,5.054719924926758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,4,power_law_1.2,2.861516761779785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,4,power_law_1.2,3.7923519134521486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,4,power_law_1.01,6.209235382080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,4,power_law_1.2,4.4202625274658205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,4,balanced,8.376229604085287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,4,power_law_1.01,9.10412826538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,4,power_law_1.2,5.618777465820313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,4,power_law_1.01,18.610879516601564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,4,power_law_1.2,7.804863739013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,4,balanced,8.09391975402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,4,power_law_1.2,15.94806365966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,4,power_law_1.2,0.08714240193367004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,4,power_law_1.2,0.12247680425643921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,4,power_law_1.2,0.10192639827728271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,4,power_law_1.2,0.12201600074768067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,4,power_law_1.2,0.17531520128250122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,4,power_law_1.2,0.23157761096954346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,4,power_law_1.2,0.2591615915298462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,4,power_law_1.2,0.3345855951309204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,4,power_law_1.2,0.3679231882095337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,4,power_law_1.2,0.3798464059829712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,4,power_law_1.2,0.39618558883666993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,4,power_law_1.2,0.4181375980377197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,4,power_law_1.2,0.4283711910247803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,4,balanced,15.882853190104166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,4,power_law_1.2,0.45505919456481936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,4,power_law_1.2,0.50316162109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,4,power_law_1.2,0.5395328044891358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,4,power_law_1.2,0.5234047889709472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,4,power_law_1.2,0.5987648010253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,4,power_law_1.2,0.6718272209167481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,4,power_law_1.2,0.10515199899673462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,4,power_law_1.2,0.7976448059082031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,4,power_law_1.2,0.8269503593444825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,4,power_law_1.2,0.1486143946647644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,4,power_law_1.2,1.0056447982788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,4,power_law_1.2,0.13944319486618043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,4,power_law_1.2,0.1345023989677429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,4,power_law_1.2,1.0864831924438476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,4,power_law_1.2,0.18378880023956298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,4,power_law_1.2,1.354316806793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,4,power_law_1.2,0.26777598857879636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,4,power_law_1.2,1.7988672256469727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,4,power_law_1.2,0.26362879276275636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,4,power_law_1.2,2.4444864273071287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,4,power_law_1.2,0.3760384082794189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,4,power_law_1.2,2.9646656036376955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,4,power_law_1.2,0.38609919548034666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,2,balanced,0.07091733316580455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,4,power_law_1.2,0.3918272018432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,4,power_law_1.2,3.5438465118408202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,2,balanced,0.08549867073694865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,4,power_law_1.2,0.40322561264038087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,2,balanced,0.12382933497428894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,4,power_law_1.2,5.960575866699219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,4,power_law_1.2,0.43288321495056153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,2,balanced,0.20808533827463785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,2,balanced,0.373088002204895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,4,power_law_1.2,0.4528639793395996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,4,power_law_1.2,11.338003540039063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,2,balanced,0.6911199887593588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,4,power_law_1.2,0.5031936168670654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,2,balanced,1.0248586336771648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,4,power_law_1.2,0.5546175956726074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,2,balanced,1.0352266629536946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,2,balanced,1.033951997756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,4,power_law_1.2,0.6173312187194824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,2,balanced,1.0376319885253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,4,power_law_1.2,0.6481919765472413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,2,balanced,1.0376319885253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,4,power_law_1.2,0.819052791595459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,2,balanced,1.065999984741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,2,balanced,1.0877119700113933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,4,power_law_1.2,0.873516845703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,2,balanced,1.0604746341705322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,2,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,2,balanced,1.075653314590454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,2,balanced,0.06728533407052358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,2,balanced,1.0817386309305828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,2,balanced,0.08678399523099263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,4,power_law_1.2,0.9176063537597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,2,balanced,1.086682637532552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,2,balanced,0.136954665184021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,4,power_law_1.2,1.0960512161254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,2,balanced,0.22347732384999594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,2,balanced,1.1191360155741374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,2,balanced,0.38944534460703534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,4,power_law_1.2,1.4194751739501954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,2,balanced,1.1603199640909831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,2,balanced,0.552069346110026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,4,power_law_1.2,1.6826816558837892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,2,balanced,0.5560319821039835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,2,balanced,1.21670397122701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,2,balanced,0.5589760144551595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,4,power_law_1.2,2.3023487091064454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,2,balanced,0.5624320109685262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,2,balanced,1.295466661453247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,4,power_law_1.2,2.9429248809814452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,2,balanced,0.5673653284708658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,2,balanced,0.576479991277059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,4,power_law_1.2,4.1280769348144535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,2,balanced,1.4058613777160645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,2,balanced,0.5786186854044596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,4,power_law_1.2,5.154444885253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,2,balanced,0.5892586708068848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,2,balanced,0.10126399993896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,2,balanced,1.5585066477457683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,2,balanced,0.6031413475672404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,2,balanced,0.10963732997576396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,2,power_law_1.01,0.06577919721603394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,4,power_law_1.2,7.604300689697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,2,power_law_1.01,0.08636159896850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,2,balanced,0.6122613350550333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,2,balanced,0.12404266993204753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,2,power_law_1.01,0.08545920252799988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,2,power_law_1.01,0.12243200540542602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,2,balanced,0.6330453157424927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,2,balanced,0.17155200242996216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,2,balanced,1.7974400520324707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,2,power_law_1.01,0.1265727996826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,4,power_law_1.2,11.527283477783204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,2,balanced,0.2501759926478068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,2,power_law_1.01,0.2014591932296753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,2,balanced,0.6765013535817465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,2,power_law_1.01,0.10833280086517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,2,balanced,0.425376017888387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,2,power_law_1.01,0.1512063980102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,2,balanced,0.7014613151550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,2,power_law_1.01,0.18032000064849854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,2,balanced,0.6025813420613607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,4,power_law_1.2,20.32488250732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,2,power_law_1.01,0.2841792106628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,2,power_law_1.01,0.24717440605163574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,2,balanced,0.7632373174031576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,2,balanced,0.607098658879598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,2,balanced,2.2671146392822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,2,power_law_1.01,0.45023360252380373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,2,balanced,0.6092319885889689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,2,power_law_1.01,0.2819648027420044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,2,balanced,0.8344000180562338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,2,power_law_1.01,0.4983488082885742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,2,balanced,0.6156213283538818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,2,power_law_1.01,0.3743232011795044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,2,power_law_1.01,0.6513728141784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,2,balanced,0.6232586701711019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,2,power_law_1.01,0.3824383974075317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,2,balanced,0.9650932947794596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,2,balanced,0.6323839823404948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,2,power_law_1.01,0.7000639915466309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,2,power_law_1.01,0.3931328058242798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,2,balanced,0.6385493278503418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,2,power_law_1.01,0.714028787612915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,2,power_law_1.01,0.41600642204284666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,2,balanced,2.737936019897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,2,balanced,1.1112693150838215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,2,balanced,0.6521653334299723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,2,power_law_1.01,0.7516416072845459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,2,power_law_1.01,0.43807358741760255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,2,balanced,0.6698933442433676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,2,power_law_1.01,0.4534656047821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,2,power_law_1.01,0.7640255928039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,2,balanced,0.6863413651784261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,2,balanced,1.3608214060465496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,2,power_law_1.01,0.5056320190429687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,2,power_law_1.01,0.7840191841125488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,2,power_law_1.01,0.5388607978820801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,2,balanced,0.7268640200297037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,2,power_law_1.01,0.834233570098877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,2,power_law_1.01,0.542195177078247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,2,balanced,0.8108159701029459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,2,power_law_1.01,0.8740096092224121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,2,power_law_1.01,0.5710976123809814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,2,power_law_1.01,0.9036352157592773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,2,balanced,1.7657279968261719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,2,balanced,3.612362543741862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,2,power_law_1.01,0.6327680110931396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,2,power_law_1.01,0.9147071838378906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,2,power_law_1.01,0.6868800163269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,2,power_law_1.01,1.0350655555725097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,2,balanced,0.890069325764974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,2,power_law_1.01,0.8093055725097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,2,power_law_1.01,1.113216018676758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,2,power_law_1.01,0.9040384292602539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,2,power_law_1.01,1.2817791938781737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,2,power_law_1.01,1.1016639709472655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,2,balanced,2.2882506052652993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,2,power_law_1.01,1.4134271621704102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,2,power_law_1.01,1.1889599800109862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,2,power_law_1.01,1.7243648529052735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,2,power_law_1.01,1.545081615447998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,2,balanced,1.0953386624654133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,2,balanced,4.738304138183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,2,power_law_1.01,1.6517824172973632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,2,power_law_1.01,1.9440767288208007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,2,power_law_1.01,2.099718475341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,2,balanced,1.2468213240305583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,2,power_law_1.01,2.6297279357910157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,2,power_law_1.01,0.10819840431213379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,2,power_law_1.01,2.6347007751464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,2,balanced,3.034677187601725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,2,power_law_1.01,3.238655853271484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,2,power_law_1.01,0.12878719568252564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,2,balanced,1.4786346753438313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,2,power_law_1.01,3.4953407287597655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,2,power_law_1.01,0.17638399600982665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,2,power_law_1.01,3.956166458129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,2,power_law_1.01,0.14672640562057496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,2,power_law_1.01,4.305171203613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,2,balanced,1.8842986424763997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,2,power_law_1.01,6.200339126586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,2,power_law_1.01,0.21393918991088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,2,power_law_1.01,5.3374591827392575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,2,power_law_1.01,0.28330240249633787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,2,power_law_1.01,11.954649353027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,2,power_law_1.01,0.32835841178894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,2,power_law_1.01,7.546099090576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,2,balanced,2.3924694061279297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,2,power_law_1.01,0.3981568098068237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,2,power_law_1.01,0.43349761962890626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,2,balanced,3.848853429158529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,2,power_law_1.01,15.193331909179687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,2,power_law_1.01,0.4539072036743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,2,balanced,7.033866882324219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,2,balanced,3.414496103922526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,2,power_law_1.01,0.4720320224761963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,2,power_law_1.01,0.5069503784179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,2,power_law_1.01,0.5355519771575927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,2,power_law_1.01,0.5661824226379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,2,power_law_1.01,0.6056575775146484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,2,balanced,4.515125274658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,2,power_law_1.2,0.08627200126647949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,2,power_law_1.01,0.6328896045684814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,2,power_law_1.2,0.12128640413284301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,2,power_law_1.01,0.7510144233703613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,2,power_law_1.2,0.1302783966064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,2,power_law_1.2,0.1514623999595642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,2,power_law_1.01,0.9054335594177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,2,power_law_1.2,0.2614527940750122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,2,balanced,5.805877049763997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,2,power_law_1.2,0.3620352029800415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,2,power_law_1.2,0.4760000228881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,2,power_law_1.01,0.9643903732299804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,2,power_law_1.2,0.6029632091522217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,2,balanced,6.218208312988281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,2,power_law_1.2,0.6665855884552002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,2,power_law_1.2,0.690880012512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,2,power_law_1.01,1.1305279731750488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,2,power_law_1.2,0.7311103820800782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,2,power_law_1.2,0.7755904197692871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,2,power_law_1.01,1.289625644683838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,2,power_law_1.2,0.7961535930633545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,2,power_law_1.01,1.7926847457885742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,2,power_law_1.2,0.8315711975097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,2,power_law_1.01,2.0292991638183593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,2,power_law_1.2,0.8787839889526368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,2,power_law_1.2,0.9042048454284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,2,power_law_1.01,2.8825023651123045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,2,power_law_1.2,0.9427071571350097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,2,power_law_1.01,3.624313735961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,2,power_law_1.2,1.063276767730713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,2,balanced,7.784677505493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,2,power_law_1.2,1.1508480072021485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,2,power_law_1.01,5.191219329833984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,2,power_law_1.2,1.3487232208251954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,2,power_law_1.2,1.4922816276550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,2,power_law_1.01,6.566886138916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,2,balanced,13.009482065836588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,2,power_law_1.2,1.9096832275390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,2,power_law_1.01,8.239730834960938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,2,power_law_1.2,1.7033855438232421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,2,power_law_1.2,2.145542335510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,2,power_law_1.01,12.897113037109374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,2,power_law_1.2,2.7561344146728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,2,power_law_1.2,3.76940803527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,2,power_law_1.2,4.377766418457031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,2,power_law_1.01,25.45888671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,2,power_law_1.2,5.545087814331055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,2,power_law_1.2,8.194099426269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,2,power_law_1.2,0.06621440052986145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,2,balanced,10.842992146809896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,2,balanced,12.24306615193685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,2,power_law_1.2,0.08541439771652222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,2,power_law_1.2,15.382144165039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,2,power_law_1.2,0.09160320162773132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,2,power_law_1.2,0.11150720119476318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,2,power_law_1.2,0.160588800907135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,2,power_law_1.2,0.22033278942108153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,2,power_law_1.2,0.2620928049087524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,2,power_law_1.2,0.35928959846496583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,2,power_law_1.2,0.37394559383392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,2,power_law_1.2,0.3859519958496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,2,power_law_1.2,0.4074687957763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,2,power_law_1.2,0.43116159439086915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,2,power_law_1.2,0.45459837913513185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,2,power_law_1.2,0.49356799125671386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,2,power_law_1.2,0.5185152053833008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,2,power_law_1.2,0.5678271770477294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,2,power_law_1.2,0.576793622970581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,2,power_law_1.2,0.6636735916137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,2,power_law_1.2,0.6895743846893311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,2,power_law_1.2,0.8412927627563477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,2,power_law_1.2,0.906879997253418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,2,power_law_1.2,1.1567232131958007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,2,balanced,24.317642211914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,2,power_law_1.2,1.2600704193115235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,2,power_law_1.2,1.6653120040893554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,2,power_law_1.2,2.021881675720215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,2,power_law_1.2,2.7823104858398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,2,power_law_1.2,3.2681278228759765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,2,power_law_1.2,4.236787033081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,1,balanced,0.073594664533933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,2,power_law_1.2,6.3820030212402346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,1,balanced,0.08995200196901958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,2,power_law_1.2,0.10890239477157593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,1,balanced,0.13249066472053528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,2,power_law_1.2,12.993203735351562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,1,balanced,0.2201546629269918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,2,power_law_1.2,0.1295807957649231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,1,balanced,0.3973333438237508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,2,power_law_1.2,0.14730240106582643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,1,balanced,0.7230559984842936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,2,power_law_1.2,0.15005439519882202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,1,balanced,1.060144027074178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,2,power_law_1.2,0.195360004901886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,1,balanced,1.0608320236206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,2,power_law_1.2,0.2657088041305542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,1,balanced,1.0621973673502605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,2,power_law_1.2,0.295142388343811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,1,balanced,1.0718986988067627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,2,power_law_1.2,0.40123519897460935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,1,balanced,1.0801706314086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,2,power_law_1.2,0.42704000473022463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,1,balanced,1.090714693069458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,1,balanced,1.1080426375071208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,2,power_law_1.2,0.4331200122833252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,1,balanced,1.1160319646199544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,2,power_law_1.2,0.4659008026123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,1,balanced,1.1207839647928874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,2,power_law_1.2,0.4958399772644043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,1,balanced,1.1344853242238362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,2,power_law_1.2,0.5214784145355225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,1,balanced,1.1370773315429688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,2,power_law_1.2,0.5691967964172363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,2,power_law_1.2,0.5982272148132324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,1,balanced,1.1860106786092122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,2,power_law_1.2,0.6528768062591552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,1,balanced,1.2568480173746746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,2,power_law_1.2,0.7327167987823486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,1,balanced,1.3622506459554036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,2,power_law_1.2,0.9487039566040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,1,balanced,1.508885383605957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,2,power_law_1.2,0.9877440452575683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,1,balanced,1.6974666913350422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,1,balanced,0.06275733311971028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,2,power_law_1.2,1.187820816040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,1,balanced,0.07286400099595387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,1,balanced,1.9486400286356609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,1,balanced,0.0969493289788564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,2,power_law_1.2,1.3270336151123048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,1,balanced,0.1500746707121531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,2,power_law_1.2,1.8468288421630858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,1,balanced,0.2476266622543335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,1,balanced,0.4452693462371826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,2,power_law_1.2,2.2198463439941407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,1,balanced,2.373535950978597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,1,balanced,0.6379679838816324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,2,power_law_1.2,2.819385528564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,1,balanced,0.6457440058390299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,1,balanced,0.6497493187586466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,2,power_law_1.2,3.8524097442626952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,1,balanced,0.6529706716537476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,1,balanced,0.6627839803695679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,2,power_law_1.2,5.241337585449219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,1,balanced,3.0442186991373696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,1,balanced,0.677669366200765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,2,power_law_1.2,6.888729858398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,1,balanced,0.6829173564910889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,1,balanced,0.7077866395314535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,2,power_law_1.2,8.608006286621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,1,balanced,0.16364266475041708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,1,balanced,0.7237706979115804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,1,balanced,0.17463467518488565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,1,balanced,0.7450133164723715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,2,power_law_1.2,13.829740905761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,1,balanced,3.9310452143351235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,1,balanced,0.19218667348225912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,1,balanced,0.7733973662058512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,1,balanced,0.24065599838892618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,1,power_law_1.01,0.06876800060272217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,1,balanced,0.8345332940419515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,1,balanced,0.33745066324869794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,1,power_law_1.01,0.05764480233192444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,1,power_law_1.01,0.08483200073242188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,2,power_law_1.2,27.048858642578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,1,balanced,0.526533325513204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,1,balanced,0.860373338063558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,1,power_law_1.01,0.06888960003852844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,1,power_law_1.01,0.13057279586791992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,1,balanced,0.7358079751332601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,1,power_law_1.01,0.093612802028656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,1,balanced,0.9589227040608724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,1,power_law_1.01,0.166048002243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,1,balanced,0.7383786837259928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,1,power_law_1.01,0.11793919801712036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,1,balanced,0.7540480295817057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,1,power_law_1.01,0.3001215934753418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,1,balanced,1.097551981608073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,1,balanced,5.040677388509114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,1,power_law_1.01,0.1906175971031189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,1,balanced,0.7681919733683268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,1,power_law_1.01,0.4566336154937744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,1,power_law_1.01,0.270796799659729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,1,balanced,0.7775786717732748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,1,power_law_1.01,0.5084095954895019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,1,balanced,1.2535040378570557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,1,balanced,0.7909599939982096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,1,power_law_1.01,0.3247936010360718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,1,power_law_1.01,0.6581696033477783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,1,balanced,0.8097226619720459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,1,power_law_1.01,0.40962557792663573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,1,power_law_1.01,0.7028736114501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,1,balanced,1.490239938100179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,1,balanced,0.8343786398569742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,1,power_law_1.01,0.4397119998931885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,1,power_law_1.01,0.7436736106872559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,1,balanced,0.874293327331543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,1,power_law_1.01,0.45198721885681153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,1,power_law_1.01,0.7657983779907227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,1,balanced,0.9096480210622152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,1,power_law_1.01,0.8155391693115235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,1,balanced,1.9250292778015137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,1,power_law_1.01,0.48383359909057616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,1,balanced,0.9795467058817545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,1,balanced,6.368837356567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,1,power_law_1.01,0.8554688453674316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,1,power_law_1.01,0.5055295944213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,1,balanced,1.1022720336914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,1,power_law_1.01,0.9158464431762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,1,power_law_1.01,0.5392831802368164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,1,power_law_1.01,0.9572159767150878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,1,power_law_1.01,0.5682432174682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,1,balanced,2.52948792775472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,1,power_law_1.01,0.9958975791931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,1,power_law_1.01,0.6171199798583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,1,power_law_1.01,1.0033023834228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,1,power_law_1.01,0.6487872123718261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,1,balanced,1.285919984181722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,1,power_law_1.01,0.14206720590591432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,1,power_law_1.01,0.6694591999053955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,1,power_law_1.01,1.1506688117980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,1,power_law_1.01,0.7523839950561524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,1,power_law_1.01,0.1537600040435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,1,power_law_1.01,1.2323583602905273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,1,power_law_1.01,0.18415360450744628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,1,power_law_1.01,0.8614912033081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,1,power_law_1.01,1.465062427520752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,1,power_law_1.01,0.21286399364471437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,1,balanced,3.4596640268961587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,1,power_law_1.01,1.0497471809387207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,1,power_law_1.01,1.6188671112060546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,1,power_law_1.01,0.2748863935470581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,1,power_law_1.01,0.35248000621795655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,1,power_law_1.01,1.1000831604003907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,1,balanced,1.6698773701985676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,1,power_law_1.01,1.9556159973144531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,1,power_law_1.01,0.41356801986694336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,1,power_law_1.01,1.36561279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,1,power_law_1.01,2.0062143325805666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,1,power_law_1.01,0.5123712062835694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,1,balanced,9.63851229349772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,1,balanced,1.9466613133748372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,1,power_law_1.01,1.5319744110107423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,1,power_law_1.01,0.5394432067871093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,1,power_law_1.01,2.5664512634277346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,1,power_law_1.01,0.5618559837341308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,1,power_law_1.01,2.012249565124512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,1,power_law_1.01,0.5889664173126221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,1,power_law_1.01,3.64400634765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,1,balanced,2.340181350708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,1,power_law_1.01,2.7751232147216798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,1,power_law_1.01,0.6201280117034912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,1,power_law_1.2,0.0689087986946106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,1,balanced,4.362858772277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,1,power_law_1.01,4.878291320800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,1,power_law_1.01,0.6673408031463623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,1,power_law_1.01,3.8390079498291017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,1,power_law_1.2,0.08540800213813782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,1,balanced,3.1170078913370767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,1,power_law_1.01,0.747372817993164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,1,power_law_1.01,5.224473571777343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,1,power_law_1.01,4.442841720581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,1,power_law_1.01,0.8165696144104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,1,power_law_1.2,0.10932480096817017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,1,power_law_1.01,0.8744000434875489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,1,power_law_1.01,6.309388732910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,1,power_law_1.2,0.1695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,1,power_law_1.01,5.4154304504394535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,1,power_law_1.01,1.0091327667236327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,1,balanced,4.041376113891602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,1,power_law_1.2,0.2734208106994629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,1,power_law_1.01,1.2444031715393067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,1,power_law_1.01,9.559616088867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,1,power_law_1.01,8.48927993774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,1,power_law_1.2,0.369868803024292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,1,power_law_1.2,0.4713727951049805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.01,1.375436782836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,1,power_law_1.01,19.872940063476562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,1,power_law_1.2,0.6385087966918945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,1,power_law_1.01,17.511085510253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,1,balanced,5.5061601003011065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,1,balanced,5.896783828735352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,1,power_law_1.2,0.6731520175933838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.01,1.6441600799560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,1,power_law_1.2,0.7151552200317383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.01,1.985625648498535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,1,power_law_1.2,0.7480959892272949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.01,2.6303552627563476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,1,power_law_1.2,0.8024383544921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.01,3.2072769165039063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,1,power_law_1.2,0.8487360000610351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.01,4.424121475219726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,1,balanced,7.888336181640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,1,power_law_1.2,0.9086144447326661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.01,5.656268692016601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,1,power_law_1.2,0.9404735565185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.01,8.12250213623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,1,power_law_1.2,0.9811136245727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.01,10.581011199951172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,1,power_law_1.2,1.0244735717773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,1,power_law_1.2,1.1598591804504395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,1,power_law_1.01,13.051846313476563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,1,balanced,18.085248311360676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,1,power_law_1.2,1.2836352348327638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,1,power_law_1.2,1.4888895988464355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,1,balanced,10.689685821533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,1,balanced,8.406623840332031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,1,power_law_1.01,20.425657653808592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,1,power_law_1.2,1.6377727508544921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,1,power_law_1.2,2.0078079223632814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,1,power_law_1.2,2.0931711196899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,1,power_law_1.01,40.1673095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,1,power_law_1.2,2.638041687011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,1,power_law_1.2,3.826067352294922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,1,power_law_1.2,5.097439956665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,1,balanced,13.288618723551432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,1,power_law_1.2,5.3447105407714846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,1,power_law_1.2,6.3984638214111325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,1,power_law_1.2,9.705881500244141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,1,power_law_1.2,20.29469451904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,1,power_law_1.2,0.058348798751831056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,1,power_law_1.2,0.06908159852027893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,1,balanced,20.8101069132487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,1,power_law_1.2,0.0818880021572113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,1,power_law_1.2,0.11678719520568848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,1,balanced,16.208101908365887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,1,power_law_1.2,0.17052799463272095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,1,power_law_1.2,0.24106240272521973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,1,power_law_1.2,0.288588809967041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,1,power_law_1.2,0.3862783908843994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,1,power_law_1.2,0.41831040382385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,1,power_law_1.2,0.44355201721191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,1,power_law_1.2,0.4605440139770508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,1,power_law_1.2,0.5114048004150391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,1,power_law_1.2,0.5301695823669433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,1,power_law_1.2,0.5682496070861817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,1,power_law_1.2,0.6180607795715332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,1,power_law_1.2,0.6417151927947998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,1,power_law_1.2,0.6768256187438965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,1,power_law_1.2,0.7667840003967286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,1,power_law_1.2,0.8656767845153809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,1,power_law_1.2,1.058899211883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,1,power_law_1.2,1.1286335945129395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,1,power_law_1.2,1.432096004486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,1,power_law_1.2,1.6085311889648437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,1,balanced,40.912068684895836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,1,power_law_1.2,2.0893375396728517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,1,power_law_1.2,2.906355285644531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,1,power_law_1.2,3.9576190948486327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,8,balanced,0.0580320010582606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,8,balanced,0.06267199913660686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,1,power_law_1.2,4.499776077270508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,8,balanced,0.06923733154932658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,1,power_law_1.2,5.461907196044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,8,balanced,0.07566933333873749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,8,balanced,0.0893440047899882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,1,power_law_1.2,8.58929901123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,8,balanced,0.11567999919255574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,8,balanced,0.11690133810043335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,1,power_law_1.2,0.1416383981704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,8,balanced,0.11733333269755046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,1,power_law_1.2,17.967776489257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,1,power_law_1.2,0.1536512017250061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,8,balanced,0.12223466237386067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,1,power_law_1.2,0.17995519638061525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,8,balanced,0.12308800220489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,1,power_law_1.2,0.2118527889251709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,8,balanced,0.12353066603342693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,1,power_law_1.2,0.26635520458221434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,8,balanced,0.16380799810091654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,8,power_law_1.01,0.10158079862594604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,8,balanced,0.1625493367513021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,1,power_law_1.2,0.32356479167938235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,8,power_law_1.01,0.12611199617385865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,8,balanced,0.16296000281969705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,1,power_law_1.2,0.3717184066772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,8,power_law_1.01,0.08620160222053527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,8,balanced,0.2887413303057353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,8,power_law_1.2,0.10211199522018433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,8,power_law_1.01,0.07624959945678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,1,power_law_1.2,0.4900032043457031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,8,power_law_1.01,0.08316159844398499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,8,balanced,0.2906186580657959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,1,power_law_1.2,0.5182720184326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,8,power_law_1.2,0.11776000261306763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,8,power_law_1.01,0.09230080246925354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,8,balanced,0.2911733388900757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,8,power_law_1.01,0.10853760242462158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,8,power_law_1.2,0.08229119777679443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,1,power_law_1.2,0.5442368030548096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,8,power_law_1.01,0.11139199733734131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,8,balanced,0.294650673866272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,8,power_law_1.2,0.07750399708747864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,8,power_law_1.01,0.11338239908218384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,1,power_law_1.2,0.5812479972839355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,8,power_law_1.01,0.11582080125808716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,8,balanced,0.29708800713221234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,8,power_law_1.2,0.08340479731559754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,1,power_law_1.2,0.6371071815490723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,8,power_law_1.01,0.11314560174942016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,8,power_law_1.01,0.1550271987915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,8,power_law_1.2,0.0945472002029419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,8,balanced,0.303765336672465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,1,power_law_1.2,0.6591040134429932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,8,power_law_1.01,0.16075520515441893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,8,power_law_1.2,0.10179200172424316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,8,power_law_1.01,0.1546560049057007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,1,power_law_1.2,0.7382912158966064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,8,balanced,0.3129546642303467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,8,power_law_1.01,0.29066240787506104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,8,power_law_1.2,0.10552959442138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,1,power_law_1.2,0.817632007598877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,8,power_law_1.01,0.292576003074646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,8,balanced,0.33504533767700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,8,power_law_1.2,0.11019519567489625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,8,power_law_1.01,0.2879103899002075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,1,power_law_1.2,0.8801919937133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,8,power_law_1.01,0.3243583917617798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,4,balanced,0.046906664967536926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,8,power_law_1.2,0.11256320476531982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,8,power_law_1.01,0.3696768045425415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,1,power_law_1.2,0.996127986907959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,8,balanced,0.3587786753972371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,8,power_law_1.2,0.11567360162734985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,4,balanced,0.052928000688552856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,8,power_law_1.01,0.38586881160736086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,1,power_law_1.2,1.2561344146728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,8,power_law_1.01,0.45566720962524415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,4,balanced,0.05453866720199585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,8,power_law_1.2,0.1635200023651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,8,balanced,0.6354613304138184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,8,power_law_1.01,0.551859188079834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,4,balanced,0.07057066758473714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,8,power_law_1.01,0.6607423782348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,8,power_law_1.2,0.15788160562515258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,8,power_law_1.01,0.9551039695739746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,4,balanced,0.08290666838486989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.2,1.3952256202697755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,8,power_law_1.2,0.16320639848709106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,8,power_law_1.01,1.2500351905822753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,8,balanced,0.6787253220876058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,4,balanced,0.10991467038790385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,8,power_law_1.01,1.5155712127685548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,8,power_law_1.2,0.2811840057373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,4,balanced,0.11038399736086528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,8,power_law_1.01,2.1494144439697265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,8,power_law_1.2,0.30342400074005127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.2,1.676595115661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,4,balanced,0.111135999361674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,8,power_law_1.01,2.928326416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,8,power_law_1.2,0.30385921001434324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,8,balanced,0.9990453720092773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,4,power_law_1.01,0.07034239768981934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,4,balanced,0.11089600125948589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.2,2.0060415267944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,8,power_law_1.01,3.930329513549805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,8,power_law_1.2,0.348089599609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,4,balanced,0.11146666606267293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,4,power_law_1.01,0.08938239812850952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,8,power_law_1.01,7.93135986328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.2,2.6589824676513674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,8,power_law_1.2,0.36728320121765134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,4,balanced,0.11191466450691223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,4,power_law_1.01,0.08005120158195496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.2,3.2579391479492186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,4,balanced,0.1267093320687612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,8,power_law_1.2,0.45477118492126467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,4,power_law_1.01,0.07407360076904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,8,balanced,1.3206506570180256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,4,balanced,0.12609066565831503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,4,power_law_1.01,0.08106240034103393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.2,4.501855850219727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,8,power_law_1.2,0.4836160182952881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,4,balanced,0.12692266702651978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,4,power_law_1.01,0.08229759931564332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,8,power_law_1.2,0.6153408050537109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.2,5.7274433135986325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,4,balanced,0.15784000356992087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,4,power_law_1.01,0.09157119989395142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,8,power_law_1.2,0.7567103862762451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,4,balanced,0.15964266657829285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,4,power_law_1.01,0.09667199850082397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.2,8.216345977783202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,8,power_law_1.2,1.209119987487793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,4,balanced,0.15957333644231161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,8,balanced,1.63754669825236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,4,power_law_1.01,0.10118399858474732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,8,power_law_1.2,1.500979232788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,4,balanced,0.31011199951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,4,power_law_1.01,0.10652159452438355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.2,10.648115539550782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,4,power_law_1.01,0.10830080509185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,8,power_law_1.2,1.987718391418457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,4,balanced,0.3126613299051921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,1,power_law_1.2,13.102720642089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,4,power_law_1.01,0.11363840103149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,8,power_law_1.2,2.776678466796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,4,balanced,0.32077866792678833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,4,power_law_1.01,0.11778559684753417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,8,power_law_1.2,3.4106048583984374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,4,balanced,0.3274453282356262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,4,power_law_1.01,0.12492799758911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,1,power_law_1.2,20.504173278808594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,4,power_law_1.01,0.1598528027534485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,8,balanced,2.60536527633667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,8,power_law_1.2,4.981222534179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,4,balanced,0.34938665231068927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,4,power_law_1.01,0.16341760158538818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,8,power_law_1.2,11.686752319335938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,4,power_law_1.01,0.1749567985534668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,4,balanced,0.37057065963745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,1,power_law_1.2,40.194522094726565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,4,power_law_1.01,0.3230079889297485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,4,balanced,0.6604799826939901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,4,power_law_1.01,0.3446208000183105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,4,power_law_1.01,0.39502720832824706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,4,power_law_1.01,0.43340158462524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,4,balanced,0.7011520067850748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,4,power_law_1.01,0.5295872211456298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,4,power_law_1.01,0.6144896030426026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,4,balanced,1.032421350479126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,4,power_law_1.01,0.8540096282958984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,4,power_law_1.01,1.0270015716552734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,4,power_law_1.2,0.07077760100364686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,4,power_law_1.01,1.499839973449707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,8,balanced,5.160458564758301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,4,power_law_1.2,0.09000319838523865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,4,power_law_1.01,1.8435583114624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,4,balanced,1.363141377766927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,4,power_law_1.2,0.06728320121765137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,4,power_law_1.01,2.2595199584960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,4,power_law_1.2,0.07448319792747497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,4,power_law_1.01,3.7521087646484377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,4,power_law_1.2,0.07883520126342773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,4,power_law_1.2,0.08213760256767273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,4,power_law_1.01,8.057196807861327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,4,balanced,1.6933919588724773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,2,balanced,0.03436800092458725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,4,power_law_1.2,0.08700159788131714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,2,balanced,0.04043733328580856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,4,power_law_1.2,0.09797760248184204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,2,balanced,0.0429013321797053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,4,power_law_1.2,0.09473279714584351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,2,balanced,0.0652159998814265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,4,power_law_1.2,0.10660480260848999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,4,power_law_1.2,0.11237119436264038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,2,balanced,0.07965333263079326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,4,power_law_1.2,0.12083840370178223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,4,balanced,2.6919094721476235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,2,balanced,0.11182933052380879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,4,power_law_1.2,0.1268288016319275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,2,balanced,0.11261866490046184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,4,power_law_1.2,0.13824000358581542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,2,balanced,0.11328533291816711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,4,power_law_1.2,0.1630911946296692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,2,balanced,0.11291733384132385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,2,balanced,0.11355200409889221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,4,power_law_1.2,0.1734655976295471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,4,power_law_1.2,0.18685439825057984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,2,balanced,0.11381866534550984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,4,power_law_1.2,0.3485759973526001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,2,balanced,0.11399466792742412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,4,power_law_1.2,0.3895359992980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,2,balanced,0.11408000191052754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,4,power_law_1.2,0.41603841781616213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,2,balanced,0.11512533823649089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,4,power_law_1.2,0.46947197914123534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,2,balanced,0.130703995625178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,4,power_law_1.2,0.6109375953674316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,4,balanced,5.326357205708821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,4,power_law_1.2,0.7269120216369629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,2,balanced,0.13173333803812662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,2,balanced,0.13377599914868674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,4,power_law_1.2,0.9507840156555176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,4,power_law_1.2,1.0874176025390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,2,balanced,0.17124267419179282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,4,power_law_1.2,1.7049663543701172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,2,balanced,0.1759893298149109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,4,power_law_1.2,2.057606315612793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,2,balanced,0.33844268321990967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,4,power_law_1.2,2.4611839294433593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,2,balanced,0.34761067231496173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,2,power_law_1.01,0.03490560054779053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,4,power_law_1.2,3.8214080810546873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,2,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,2,balanced,0.3696266810099284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,2,power_law_1.01,0.04451839923858643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,4,power_law_1.2,9.100959777832031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,2,power_law_1.01,0.06116480231285095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,2,balanced,0.3906186819076538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,2,power_law_1.01,0.06601600050926208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,2,power_law_1.01,0.07930240035057068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,2,balanced,0.6929972966512045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,2,power_law_1.01,0.09290239810943604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,2,power_law_1.01,0.09527040123939515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,2,power_law_1.01,0.10093439817428589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,2,balanced,0.7355733712514242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,2,power_law_1.01,0.10058239698410035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,2,power_law_1.01,0.10651520490646363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,2,power_law_1.01,0.1117184042930603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,2,power_law_1.01,0.11463040113449097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,2,balanced,1.0806667009989421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,2,power_law_1.01,0.126803195476532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,2,power_law_1.01,0.1329408049583435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,2,power_law_1.01,0.13698559999465942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,2,power_law_1.01,0.15438079833984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,2,power_law_1.01,0.19302400350570678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,2,balanced,1.427061398824056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,2,power_law_1.01,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,2,power_law_1.01,0.38886399269104005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,2,power_law_1.01,0.4532032012939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,2,power_law_1.01,0.5101183891296387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,2,power_law_1.01,0.6115903854370117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,2,power_law_1.01,0.7925119876861573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,2,balanced,1.769968032836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,2,power_law_1.01,0.9937151908874512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,2,power_law_1.01,1.406112003326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,2,power_law_1.01,1.6944063186645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,1,balanced,0.028010666370391846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,2,power_law_1.2,0.035366401076316833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,2,power_law_1.01,2.0595071792602537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,1,balanced,0.03254933406909307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,2,power_law_1.2,0.04199680089950562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,2,power_law_1.01,3.1332799911499025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,1,balanced,0.03805333375930786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,2,power_law_1.2,0.044268798828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,1,balanced,0.05648533503214518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,2,power_law_1.01,7.035417938232422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,2,power_law_1.2,0.05989760160446167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,2,balanced,2.809077262878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,1,power_law_1.01,0.027577599883079527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,2,power_law_1.2,0.06336640119552613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,1,balanced,0.08222400148709615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,1,power_law_1.01,0.03235200047492981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,2,power_law_1.2,0.07930880188941955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,1,balanced,0.11961066722869873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,1,power_law_1.01,0.036601600050926206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,2,power_law_1.2,0.08724480271339416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,1,balanced,0.11402666568756104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,1,power_law_1.01,0.04912000000476837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,2,power_law_1.2,0.09489279985427856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,1,balanced,0.11353066563606262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,2,power_law_1.2,0.09512959718704224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,1,power_law_1.01,0.06199679970741272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,1,balanced,0.11428800225257874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,2,power_law_1.2,0.09690240025520325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,1,power_law_1.01,0.0726144015789032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,2,power_law_1.2,0.10949759483337403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,1,balanced,0.11404800415039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,1,power_law_1.01,0.09068160057067871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,1,power_law_1.2,0.027526399493217467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,1,balanced,0.11370666821797688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,2,power_law_1.2,0.11119359731674194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,1,power_law_1.01,0.09397119879722596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,1,power_law_1.2,0.031148800253868104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,1,balanced,0.11454400420188904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,2,power_law_1.2,0.12104959487915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,1,power_law_1.01,0.09584640264511109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,1,power_law_1.2,0.035980799794197084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,1,balanced,0.11493866642316182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,2,power_law_1.2,0.1283519983291626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,1,power_law_1.01,0.09747200012207032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,1,power_law_1.2,0.04682239890098572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,1,balanced,0.11559999982515971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,2,power_law_1.2,0.1346560001373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,1,power_law_1.01,0.10467840433120727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,2,power_law_1.2,0.14993280172348022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,1,balanced,0.11672000090281169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,1,power_law_1.2,0.05889279842376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,1,power_law_1.01,0.10867840051651001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,2,power_law_1.2,0.15828479528427125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,2,balanced,5.56278928120931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,1,balanced,0.118559996287028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,1,power_law_1.2,0.06647679805755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,2,power_law_1.2,0.21532800197601318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,1,power_law_1.01,0.11096960306167603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,1,balanced,0.12211199601491292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,1,power_law_1.2,0.08488960266113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,2,power_law_1.2,0.2318592071533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,1,power_law_1.01,0.12325119972229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,2,power_law_1.2,0.42175998687744143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,1,balanced,0.14443199833234152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,1,power_law_1.2,0.08563200235366822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,1,power_law_1.01,0.13025280237197875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,2,power_law_1.2,0.4748095989227295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,1,balanced,0.14994666973749796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,1,power_law_1.2,0.09329919815063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,2,power_law_1.2,0.5631487846374512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,1,power_law_1.01,0.14168319702148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,2,power_law_1.2,0.6484928131103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,1,power_law_1.2,0.09587200284004212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,1,power_law_1.01,0.16883840560913085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,1,balanced,0.2016213337580363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,2,power_law_1.2,0.8746687889099121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,1,power_law_1.2,0.10181759595870972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,1,power_law_1.01,0.18317439556121826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,2,power_law_1.2,1.0288384437561036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,1,balanced,0.21271467208862305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,1,power_law_1.01,0.20621440410614014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,2,power_law_1.2,1.4702464103698731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,1,power_law_1.2,0.1076159954071045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,2,power_law_1.2,1.884454345703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,1,balanced,0.4077226718266805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,1,power_law_1.01,0.26464641094207764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,1,power_law_1.2,0.11515519618988038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,2,power_law_1.2,2.452403259277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,1,power_law_1.01,0.30593280792236327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,1,power_law_1.2,0.12245759963989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,2,power_law_1.2,3.5033599853515627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,1,balanced,0.43275733788808185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,1,power_law_1.01,0.5448639869689942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,1,power_law_1.2,0.13657599687576294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,2,power_law_1.2,6.848274993896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,1,power_law_1.01,0.6352064132690429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,1,power_law_1.2,0.14473600387573243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,1,balanced,0.7683253288269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,1,power_law_1.01,0.8380224227905273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,1,power_law_1.2,0.17310719490051268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,1,power_law_1.01,1.015878391265869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,1,power_law_1.2,0.18651520013809203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,1,balanced,0.8170613447825114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,1,power_law_1.01,1.3913344383239745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,1,power_law_1.2,0.21418240070343017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,1,power_law_1.01,1.7641920089721679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,1,power_law_1.2,0.2722111940383911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,1,balanced,1.196010669072469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,1,power_law_1.2,0.32027521133422854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,1,power_law_1.01,2.134252738952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,1,power_law_1.2,0.573747205734253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,1,power_law_1.01,3.2620670318603517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,8,balanced,0.056874667604764305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,1,power_law_1.2,0.6684224128723144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,1,power_law_1.01,6.261471939086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,1,power_law_1.2,0.8479424476623535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,1,balanced,1.5742400487263997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,8,balanced,0.058042665322621666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,1,power_law_1.2,1.038707160949707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,1,power_law_1.2,1.4133952140808106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,8,balanced,0.06029866635799408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,1,power_law_1.2,1.7716863632202149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,1,balanced,1.9502399762471516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,1,power_law_1.2,2.150374412536621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,8,power_law_1.01,0.08732159733772278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,8,balanced,0.05974400043487549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,1,power_law_1.2,3.262284851074219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,8,power_law_1.01,0.07275519967079162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,1,power_law_1.2,6.256793594360351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,8,power_law_1.01,0.07635200023651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,8,balanced,0.07156266768773396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,8,power_law_1.01,0.05987200140953064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,8,power_law_1.01,0.070387202501297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,1,balanced,3.0824639002482095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,8,balanced,0.07803733150164287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,8,power_law_1.01,0.07757440209388733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,8,balanced,0.07750399907430013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,8,balanced,0.07924800117810567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,8,power_law_1.01,0.08236799836158752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,8,balanced,0.11335466305414836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,8,power_law_1.01,0.07920640110969543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,8,balanced,0.11276800433794658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,8,power_law_1.01,0.11572480201721191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,8,balanced,0.11339733004570007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,8,power_law_1.01,0.11373440027236939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,8,balanced,0.11295466621716817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,8,power_law_1.01,0.11489280462265014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,8,balanced,0.11297600467999776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,1,balanced,6.103957494099935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,8,power_law_1.01,0.11656960248947143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,8,balanced,0.11367467045783997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,8,power_law_1.01,0.11455999612808228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,8,balanced,0.11395200093587239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,8,power_law_1.2,0.07764480113983155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,8,power_law_1.01,0.12624000310897826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,8,balanced,0.11505066355069478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,8,power_law_1.01,0.1403264045715332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,8,power_law_1.2,0.06637439727783204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,8,balanced,0.1163040002187093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,8,power_law_1.01,0.15192320346832275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,8,power_law_1.2,0.07000960111618042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,8,balanced,0.11975466211636861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,8,power_law_1.01,0.17920000553131105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,8,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,8,balanced,0.1220960021018982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,8,power_law_1.01,0.20079998970031737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,8,power_law_1.2,0.07079039812088013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,8,balanced,0.19288533926010132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,8,power_law_1.01,0.2241919994354248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,8,power_law_1.2,0.07712640166282654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,8,balanced,0.2014346718788147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,8,power_law_1.01,0.2988032102584839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,8,power_law_1.2,0.07722240090370178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,8,power_law_1.01,0.38052480220794677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,8,balanced,0.2965386708577474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,8,power_law_1.2,0.08204799890518188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,8,power_law_1.01,0.592844820022583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,8,power_law_1.2,0.11641600131988525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,8,balanced,0.34726933638254803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,8,power_law_1.2,0.11354880332946778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,8,power_law_1.01,0.835910415649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,8,power_law_1.2,0.11250560283660889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,8,power_law_1.01,1.1157119750976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,8,balanced,0.5192960103352865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,8,power_law_1.2,0.11695359945297241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,8,power_law_1.01,1.2073792457580566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,8,power_law_1.2,0.11682560443878173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,8,power_law_1.01,2.2234111785888673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,8,power_law_1.2,0.1280959963798523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,8,balanced,0.6679893334706625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,4,balanced,0.0459199994802475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,8,power_law_1.2,0.16241919994354248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,8,power_law_1.01,2.8559167861938475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,8,power_law_1.2,0.15289599895477296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,8,power_law_1.01,3.123910331726074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,4,balanced,0.05156800150871277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,8,power_law_1.2,0.18328959941864015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,8,balanced,0.985706647237142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,8,power_law_1.01,5.858054351806641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,8,power_law_1.2,0.21887359619140626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,4,balanced,0.05412266651789347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,8,power_law_1.2,0.28677759170532224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,4,power_law_1.01,0.06036480069160462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,8,power_law_1.01,10.448998260498048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,4,balanced,0.06483733157316844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,8,power_law_1.2,0.37207679748535155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,4,balanced,0.056048000852266945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,4,power_law_1.01,0.06230400204658508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,8,power_law_1.2,0.49910402297973633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,8,balanced,1.3054239749908447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,4,balanced,0.05641066531340281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,4,power_law_1.01,0.06661120057106018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,8,power_law_1.2,0.6989183902740479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,4,balanced,0.060640002290407814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,4,power_law_1.01,0.06724479794502258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,4,balanced,0.06106133262316386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,8,power_law_1.2,0.7756800174713134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,4,power_law_1.01,0.05451520085334778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,4,balanced,0.06809066732724507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,8,power_law_1.2,1.4554752349853515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,4,power_law_1.01,0.05516800284385681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,4,balanced,0.06861866513888042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,4,power_law_1.01,0.05984640121459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,4,balanced,0.0690719981988271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,8,balanced,1.6219733556111653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,8,power_law_1.2,2.1786880493164062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,4,balanced,0.11742400129636128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,4,power_law_1.01,0.06040319800376892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,8,power_law_1.2,3.50445442199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,4,balanced,0.11738133430480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,4,power_law_1.01,0.06980479955673217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,4,balanced,0.11749333143234253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,4,power_law_1.01,0.07218559980392455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,8,power_law_1.2,4.076236724853516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,4,balanced,0.11813333630561829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,4,power_law_1.01,0.0704576015472412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,8,power_law_1.2,4.754924774169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,4,power_law_1.01,0.11807359457015991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,4,balanced,0.11906133095423381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,4,power_law_1.01,0.11951999664306641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,4,balanced,0.12037332852681477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,8,power_law_1.2,8.850969696044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,4,power_law_1.01,0.12276480197906495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,8,balanced,2.5787199338277182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,4,balanced,0.12378666798273723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,4,power_law_1.01,0.12284159660339355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,4,power_law_1.01,0.1245695948600769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,4,balanced,0.12635200222333273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,8,power_law_1.2,20.472256469726563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,4,power_law_1.01,0.15545599460601806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,4,power_law_1.2,0.0650111973285675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,4,power_law_1.01,0.17944320440292358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,4,balanced,0.18141865730285645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,4,power_law_1.01,0.21148159503936767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,4,power_law_1.2,0.06666240096092224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,4,power_law_1.01,0.2695807933807373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,4,balanced,0.1907786726951599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,4,power_law_1.2,0.0639743983745575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,4,power_law_1.01,0.3450495958328247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,4,power_law_1.2,0.06863999962806702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,4,balanced,0.28837867577870685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,4,power_law_1.01,0.43535361289978025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,4,power_law_1.2,0.0554751992225647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,4,power_law_1.01,0.6166016101837158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,4,balanced,0.35709333419799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,4,power_law_1.01,0.9800255775451661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,4,power_law_1.2,0.05763840079307556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,4,power_law_1.01,1.092569637298584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,2,balanced,0.03311999887228012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,4,power_law_1.2,0.061247998476028444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,4,balanced,0.5233120123545328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,4,power_law_1.01,2.292620849609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,2,balanced,0.03860799968242645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,4,power_law_1.2,0.06352000236511231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,4,power_law_1.01,2.5081600189208983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,4,power_law_1.2,0.07049599885940552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,4,balanced,0.6871306896209717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,2,balanced,0.040976000328858696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,8,balanced,5.1236371994018555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,4,power_law_1.01,3.2668609619140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,4,power_law_1.2,0.07093120217323304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,4,power_law_1.2,0.07128319740295411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,2,balanced,0.06217599908510844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,4,power_law_1.01,3.9441280364990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,4,power_law_1.2,0.11907199621200562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,2,balanced,0.056015998125076294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,4,power_law_1.01,10.548102569580077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,4,balanced,1.015760024388631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,4,power_law_1.2,0.12509440183639525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,2,balanced,0.056405335664749146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,4,power_law_1.2,0.12184319496154786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,2,balanced,0.0565226674079895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,4,power_law_1.2,0.12558720111846924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,2,balanced,0.05705066521962484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,4,power_law_1.2,0.1455423951148987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,2,balanced,0.05850133299827576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,4,balanced,1.3446346918741863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,4,power_law_1.2,0.158406400680542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,2,balanced,0.058970664938290916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,4,power_law_1.2,0.1795583963394165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,2,balanced,0.05972266693909963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,2,balanced,0.0713919997215271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,4,power_law_1.2,0.21989119052886963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,2,balanced,0.07070399820804596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,4,power_law_1.2,0.2878528118133545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,4,balanced,1.6730507214864094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,2,balanced,0.07181333502133687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,4,power_law_1.2,0.35019519329071047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,2,balanced,0.1123253305753072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,4,power_law_1.2,0.45544958114624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,2,balanced,0.11327466368675232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,4,power_law_1.2,0.6855487823486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,2,balanced,0.11500266194343567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,4,power_law_1.2,0.9811840057373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,2,balanced,0.1188106636206309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,2,power_law_1.01,0.033907198905944826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,2,balanced,0.12299733360608418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,4,power_law_1.2,1.1915136337280274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,2,balanced,0.19084266821543375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,2,power_law_1.01,0.03863680064678192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,4,power_law_1.2,1.7445184707641601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,2,balanced,0.2000053326288859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,2,power_law_1.01,0.04039680063724518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,4,balanced,2.6615039507548013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,4,power_law_1.2,2.9833919525146486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,2,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,2,balanced,0.298309326171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,4,power_law_1.2,3.464863967895508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,2,power_law_1.01,0.05568640232086182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,2,balanced,0.37652266025543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,4,power_law_1.2,4.313625717163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,2,power_law_1.01,0.05564799904823303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,2,power_law_1.01,0.060499197244644164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,2,balanced,0.5505013465881348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,4,power_law_1.2,12.004032135009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,2,power_law_1.01,0.06458240151405334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,2,balanced,0.7244853178660074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,2,power_law_1.01,0.06641280055046081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,2,power_law_1.01,0.06956160068511963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,2,power_law_1.01,0.07332479953765869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,2,balanced,1.0632212956746419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,2,power_law_1.01,0.0717631995677948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,2,power_law_1.01,0.07329919934272766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,2,power_law_1.01,0.07723519802093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,4,balanced,5.2936960856119795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,2,balanced,1.4009226163228352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,2,power_law_1.01,0.1251711964607239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,2,power_law_1.01,0.1307904005050659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,2,power_law_1.01,0.1443519949913025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,2,power_law_1.01,0.1729472041130066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,2,balanced,1.743578592936198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,2,power_law_1.01,0.19397120475769042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,2,power_law_1.2,0.03307519853115082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,2,power_law_1.01,0.2398591995239258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,2,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,2,power_law_1.01,0.28231680393218994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,2,power_law_1.2,0.04133760035037994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,2,power_law_1.01,0.39071359634399416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,2,power_law_1.2,0.050892800092697144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,2,power_law_1.01,0.5234047889709472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,2,power_law_1.2,0.05544959902763367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,2,power_law_1.01,0.7069632053375244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,2,balanced,2.7766825358072915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,2,power_law_1.2,0.0574400007724762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,2,power_law_1.01,0.9112447738647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,2,power_law_1.2,0.06235520243644714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,2,power_law_1.01,1.4042559623718263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,2,power_law_1.2,0.06490240097045899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,2,power_law_1.01,2.0769088745117186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,2,power_law_1.2,0.0689087986946106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,2,power_law_1.01,2.235340881347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,2,power_law_1.2,0.07221760153770447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,2,power_law_1.01,3.3547073364257813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,2,power_law_1.2,0.07334399819374085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,2,power_law_1.2,0.07235199809074402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,2,power_law_1.01,7.419513702392578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,1,balanced,0.027072000006834667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,2,power_law_1.2,0.073471999168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,1,balanced,0.03145066648721695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,2,power_law_1.2,0.07488639950752259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,2,power_law_1.2,0.1309056043624878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,1,balanced,0.036533333361148834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,2,power_law_1.2,0.12947200536727904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,1,balanced,0.054234668612480164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,2,balanced,5.497045516967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,2,power_law_1.2,0.140447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,2,power_law_1.2,0.16927360296249389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,1,balanced,0.05526933570702871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,2,power_law_1.2,0.21431679725646974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,1,balanced,0.05167999863624573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,1,power_law_1.01,0.02656640112400055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,1,balanced,0.05182399849096934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,2,power_law_1.2,0.26010239124298096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,1,power_law_1.01,0.029446399211883544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,1,balanced,0.05173333485921224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,2,power_law_1.2,0.29587841033935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,1,power_law_1.01,0.03487359881401062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,1,balanced,0.05226666728655497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,1,power_law_1.01,0.041075199842453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,2,power_law_1.2,0.40320000648498533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,1,balanced,0.0525493323802948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,1,power_law_1.01,0.05366399884223938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,2,power_law_1.2,0.5821760177612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,1,power_law_1.01,0.05077760219573975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,1,balanced,0.05207466582457224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,2,power_law_1.2,0.7437183856964111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,1,power_law_1.2,0.026630398631095887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,1,power_law_1.01,0.05240319967269898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,1,balanced,0.05727999905745188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,2,power_law_1.2,0.9241408348083496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,1,power_law_1.2,0.029523199796676634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,1,power_law_1.01,0.05306239724159241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,1,balanced,0.05754133562246958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,2,power_law_1.2,1.6483200073242188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,1,power_law_1.01,0.05863040089607239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,1,power_law_1.2,0.03251200020313263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,1,balanced,0.05787200232346853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,2,power_law_1.2,2.004435157775879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,1,power_law_1.01,0.06304640173912049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,1,power_law_1.2,0.04123519957065582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,1,balanced,0.0684746652841568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,1,power_law_1.01,0.06520959734916687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,1,power_law_1.2,0.05319679975509643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,2,power_law_1.2,2.437599945068359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,1,balanced,0.07035199801127116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,1,power_law_1.01,0.07043840289115906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,1,power_law_1.2,0.05081599950790405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,2,power_law_1.2,3.9871360778808596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,1,balanced,0.07261866827805837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,1,power_law_1.01,0.06851840019226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,1,power_law_1.2,0.05287039875984192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,1,balanced,0.1252959966659546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,1,power_law_1.01,0.07383040189743043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,2,power_law_1.2,8.44037094116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,1,power_law_1.2,0.053286397457122804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,1,power_law_1.01,0.07861760258674622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,1,balanced,0.12971199552218118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,1,power_law_1.2,0.060659199953079224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,1,power_law_1.01,0.09402880072593689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,1,power_law_1.2,0.06318079829216003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,1,balanced,0.2077653408050537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,1,power_law_1.01,0.10072959661483764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,1,power_law_1.2,0.06625279784202576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,1,power_law_1.01,0.16860159635543823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,1,balanced,0.21766400337219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,1,power_law_1.2,0.06869120001792908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,1,power_law_1.01,0.18539520502090454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,1,power_law_1.2,0.07236480116844177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,1,balanced,0.32683734099070233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,1,power_law_1.01,0.23525760173797608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,1,power_law_1.2,0.07528960108757018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,1,power_law_1.01,0.27614080905914307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,1,balanced,0.41655464967091876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,1,power_law_1.2,0.07591040134429931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,1,power_law_1.01,0.37511680126190183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,1,power_law_1.2,0.09437440037727356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,1,power_law_1.01,0.46241278648376466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,1,balanced,0.6072746515274048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,1,power_law_1.2,0.10243840217590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,8,balanced,0.07522666454315186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,1,power_law_1.01,0.6568895816802979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,1,power_law_1.2,0.1686911940574646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,8,balanced,0.07293866574764252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,1,power_law_1.01,0.8469056129455567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,1,balanced,0.7994773387908936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,1,power_law_1.2,0.18534400463104247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,8,balanced,0.07287466526031494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,1,power_law_1.01,1.2201791763305665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,1,power_law_1.2,0.23617920875549317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,8,balanced,0.0729013333717982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,1,power_law_1.01,1.5960512161254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,8,balanced,0.05695466697216034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,1,power_law_1.2,0.27448320388793945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,8,balanced,0.07403199871381123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,1,balanced,1.1757226785024006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,1,power_law_1.01,1.9729536056518555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,8,balanced,0.056128000219662987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,1,power_law_1.2,0.3774463891983032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,8,balanced,0.07471466561158498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,8,balanced,0.05489066739877065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,1,power_law_1.01,3.098841667175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,8,balanced,0.07448533177375793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,1,power_law_1.2,0.4628159999847412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,8,balanced,0.05778666834036509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,8,balanced,0.07423999905586243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,1,power_law_1.2,0.6576704025268555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,1,power_law_1.01,6.094009780883789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,8,balanced,0.058821335434913635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,8,balanced,0.07773866752783458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,1,power_law_1.2,0.8507200241088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,1,balanced,1.5491573015848796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,8,balanced,0.059434667229652405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,8,balanced,0.07755200068155925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,1,power_law_1.2,1.2271167755126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,8,balanced,0.059343998630841575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,8,balanced,0.07638399799664815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,1,power_law_1.2,1.6001728057861329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,8,balanced,0.0595413347085317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,8,balanced,0.07967466612656911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,8,balanced,0.08133866886297862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,8,balanced,0.059658666451772056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,1,power_law_1.2,1.9725376129150392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,8,balanced,0.060592000683148704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,1,balanced,1.9240907033284504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,8,balanced,0.08920533458391826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,1,power_law_1.2,3.0976703643798826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,8,balanced,0.06095466514428457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,8,balanced,0.09057066837946574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,8,balanced,0.060090666015942894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,1,power_law_1.2,6.104723358154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,8,balanced,0.08905599514643352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,8,balanced,0.06084266801675161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,8,balanced,0.105103999376297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,8,balanced,0.06355733176072438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,8,balanced,0.10669333736101787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,8,balanced,0.0703893353541692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,8,balanced,0.11904533704121907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,8,balanced,0.07172266642252605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,8,balanced,0.18360533316930136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,1,balanced,3.0424159367879233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,8,balanced,0.07092800239721934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,8,balanced,0.16313067078590393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,8,balanced,0.08779733379681905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,8,balanced,0.24683199326197305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,8,balanced,0.09205866853396098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,8,balanced,0.2853599985440572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,8,balanced,0.12406933307647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,8,power_law_1.01,0.07194240093231201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,8,balanced,0.1288159986337026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,8,balanced,0.4469013214111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,8,balanced,0.18345600366592407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,8,power_law_1.01,0.07184000015258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,8,balanced,0.49701865514119464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,8,power_law_1.01,0.0717248022556305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,8,balanced,0.2172586719195048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,8,power_law_1.01,0.07226880192756653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,8,balanced,0.049178664882977806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,8,power_law_1.01,0.07281280159950257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,8,balanced,0.32550400495529175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,8,balanced,0.7482720216115316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,8,balanced,0.047797332207361855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,8,power_law_1.01,0.07683839797973632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,8,balanced,0.04770666857560476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,8,balanced,0.050383999943733215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,8,balanced,0.3765759865442912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,8,power_law_1.01,0.07800319790840149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,8,balanced,0.05179733534653982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,8,power_law_1.01,0.08606079816818238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,8,balanced,0.9605600039164225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,8,balanced,0.05231466889381409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,1,balanced,6.0456587473551435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,8,balanced,0.05263466636339823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,8,power_law_1.01,0.24323201179504395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,8,balanced,0.5530826648076376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,8,balanced,0.052709331115086876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,8,power_law_1.01,0.7107456207275391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,8,balanced,1.1767093340555828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,8,power_law_1.01,0.8376895904541015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,8,balanced,0.0535093347231547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,8,balanced,0.7116959889729818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,8,power_law_1.01,0.8874624252319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,8,balanced,0.054527997970581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,8,power_law_1.01,0.9011775970458984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,8,power_law_1.01,0.12307840585708618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,8,balanced,0.8690826892852783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,8,balanced,1.9213226636250813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,8,power_law_1.01,0.16073600053787232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,8,power_law_1.01,0.16776319742202758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,8,balanced,0.054048001766204834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,8,power_law_1.01,0.17811199426651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,8,balanced,0.05554133156935374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,8,power_law_1.01,0.24958720207214355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,8,balanced,1.4030613899230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,8,balanced,0.05625066657861074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,8,power_law_1.01,0.28901119232177735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,8,balanced,0.055674667159716286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,8,power_law_1.01,0.05201280117034912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,8,power_law_1.01,0.3736448049545288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,8,power_law_1.01,0.05443199872970581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,8,power_law_1.01,0.5021376132965087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,8,balanced,3.717520078023275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,8,power_law_1.01,0.0531328022480011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,8,power_law_1.01,0.7528575897216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,8,power_law_1.01,0.05606399774551392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,8,power_law_1.01,0.8955007553100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,8,power_law_1.01,0.05622400045394897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,8,balanced,0.06400000055631001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,8,power_law_1.01,1.34716796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,8,power_law_1.01,0.057555198669433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,8,balanced,2.7128480275472007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,8,balanced,0.06577066580454509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,8,power_law_1.01,1.7723392486572265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,8,balanced,0.06632000207901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,8,power_law_1.01,0.06288639903068542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,8,power_law_1.01,2.764396858215332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,8,power_law_1.01,0.06561279892921448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,8,power_law_1.01,0.06993280053138733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,8,balanced,0.08483200271924336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,8,power_law_1.01,3.4294910430908203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,8,balanced,0.08876799543698628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,8,power_law_1.01,0.0768064022064209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,8,power_law_1.01,3.9410945892333986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,8,power_law_1.01,0.06711680293083191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,8,power_law_1.01,7.2725372314453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,8,power_law_1.01,0.0769599974155426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,8,balanced,0.11577066779136658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,8,power_law_1.01,0.08750720024108886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,8,power_law_1.01,15.0914306640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,8,power_law_1.01,0.09403520226478576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,8,power_law_1.01,0.11844480037689209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,8,balanced,0.13942399621009827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,8,power_law_1.01,0.12599040269851686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,8,balanced,0.20165334145228067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,8,power_law_1.01,0.11832959651947021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,8,balanced,0.23895466327667236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,8,power_law_1.01,0.17895040512084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,8,power_law_1.01,0.20492799282073976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,8,power_law_1.01,0.29665920734405515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,8,power_law_1.01,0.2871040105819702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,8,balanced,0.37353066603342694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,8,power_law_1.01,0.4673151969909668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,8,power_law_1.01,0.046982398629188536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,8,power_law_1.01,0.5820864200592041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,8,balanced,0.47166399161020917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,8,power_law_1.01,0.8094655990600585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,8,power_law_1.01,0.04726400077342987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,8,balanced,0.7028000354766846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,8,power_law_1.01,1.0379520416259767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,8,power_law_1.01,0.04775680005550385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,8,power_law_1.01,0.05041279792785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,8,power_law_1.01,1.685887908935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,8,balanced,0.9418346881866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,8,power_law_1.01,0.05115519762039185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,8,power_law_1.2,0.07041919827461243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,8,power_law_1.01,1.973593521118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,8,power_law_1.01,0.056627202033996585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,8,power_law_1.2,0.07203199863433837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,8,power_law_1.01,2.6960512161254884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,8,power_law_1.01,0.06035839915275574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,8,power_law_1.2,0.0719871997833252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,8,balanced,1.157861312230428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,8,power_law_1.01,4.092524719238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,8,power_law_1.01,0.06839680075645446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,8,power_law_1.2,0.0725055992603302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,8,power_law_1.2,0.07304319739341736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,8,power_law_1.01,8.696383666992187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,8,power_law_1.01,0.06947199702262878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,8,power_law_1.2,0.07548800110816956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,8,balanced,1.8354345957438152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,8,power_law_1.01,0.07234560251235962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,8,power_law_1.2,0.0813696026802063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,8,power_law_1.2,0.08935040235519409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,8,power_law_1.2,0.5576767921447754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,8,power_law_1.01,0.07120640277862549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,8,power_law_1.01,0.07917439937591553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,8,power_law_1.2,0.7029568195343018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,8,power_law_1.01,0.08762879967689514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,8,power_law_1.2,0.850489616394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,8,power_law_1.01,0.09761279821395874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,8,power_law_1.2,0.8741696357727051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,8,balanced,3.6184374491373696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,8,power_law_1.2,0.05464959740638733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,8,power_law_1.2,0.910041618347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,8,power_law_1.2,0.05618559718132019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,8,power_law_1.01,0.10483200550079345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,8,power_law_1.2,0.12373119592666626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,8,power_law_1.2,0.05446400046348572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,8,power_law_1.01,0.11497600078582763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,8,power_law_1.2,0.1598207950592041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,8,power_law_1.2,0.0574400007724762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,8,power_law_1.01,0.15045119524002076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,8,power_law_1.2,0.17530879974365235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,8,power_law_1.2,0.0575872004032135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,8,power_law_1.2,0.1764415979385376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,8,power_law_1.01,0.19367680549621583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,8,power_law_1.2,0.05882880091667175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,8,power_law_1.2,0.23303039073944093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,8,power_law_1.01,0.25501439571380613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,8,power_law_1.2,0.0642624020576477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,8,power_law_1.2,0.2997503995895386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,8,power_law_1.2,0.06275839805603027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,8,power_law_1.2,0.4245312213897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,8,power_law_1.01,0.3579200029373169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,8,power_law_1.2,0.0710528016090393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,8,power_law_1.2,0.533132791519165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,8,power_law_1.2,0.07912960052490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,8,power_law_1.01,0.3578304052352905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,8,power_law_1.2,0.7880512237548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,8,power_law_1.2,0.07000319957733155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,8,power_law_1.01,0.6515776157379151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,8,power_law_1.2,0.9362560272216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,8,power_law_1.2,0.07769600152969361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,8,power_law_1.01,0.8214528083801269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,8,power_law_1.2,1.2538687705993652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,8,power_law_1.2,0.0874176025390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,8,power_law_1.2,1.702841567993164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,8,power_law_1.2,0.09489279985427856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,8,power_law_1.01,1.343724822998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,8,power_law_1.2,0.10792959928512573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,8,power_law_1.2,2.759494400024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,8,power_law_1.01,1.7196096420288085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,8,power_law_1.2,0.12985600233078004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,8,power_law_1.2,3.544492721557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,8,power_law_1.01,2.307571220397949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,8,power_law_1.2,0.12277760505676269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,8,power_law_1.01,3.31014404296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,8,power_law_1.2,4.269094467163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,8,power_law_1.2,0.17690240144729613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,8,power_law_1.2,0.20873599052429198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,8,power_law_1.01,4.255430221557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,8,power_law_1.2,7.4244224548339846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,8,power_law_1.2,0.27546238899230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,4,balanced,0.05611733098824819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,8,power_law_1.01,6.2798206329345705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,8,power_law_1.2,0.2920703887939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,8,power_law_1.2,14.963743591308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,4,balanced,0.052853330969810486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,8,power_law_1.2,0.4632256031036377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,4,balanced,0.06677333513895671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,8,power_law_1.01,13.3038330078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,8,power_law_1.2,0.04750080108642578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,8,power_law_1.2,0.5349440097808837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,4,balanced,0.06889066596825917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,8,power_law_1.2,0.8083968162536621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,8,power_law_1.2,0.04718720018863678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,4,balanced,0.06954666475454967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,8,power_law_1.2,1.0950016021728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,8,power_law_1.2,0.04785279929637909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,4,balanced,0.07069333394368489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,8,power_law_1.2,0.05103999972343445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,8,power_law_1.2,1.7337472915649415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,4,balanced,0.07054933408896129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,4,balanced,0.044213334719340004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,8,power_law_1.2,0.0514240026473999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,4,balanced,0.07041599849859874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,8,power_law_1.2,2.162009620666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,4,balanced,0.04190933207670847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,4,balanced,0.07341333230336507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,8,power_law_1.2,0.057120001316070555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,4,balanced,0.05129066606362661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,8,power_law_1.2,2.6689855575561525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,4,balanced,0.07310933371384938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,8,power_law_1.2,0.06346880197525025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,4,balanced,0.053488001227378845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,8,power_law_1.2,4.284262466430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,4,balanced,0.0772266685962677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,8,power_law_1.2,0.06748800277709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,4,balanced,0.0545066644748052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,4,balanced,0.07825066645940144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,4,balanced,0.055349335074424744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,8,power_law_1.2,8.957625579833984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,8,power_law_1.2,0.08461440205574036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,4,balanced,0.055205335219701133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,4,balanced,0.0784853349129359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,4,balanced,0.08538132905960083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,4,balanced,0.05555733541647593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,8,power_law_1.2,0.07952640056610108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,4,balanced,0.09008533755938213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,4,balanced,0.05713599920272827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,4,balanced,0.09009599685668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,4,balanced,0.0572213331858317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,4,balanced,0.10083733002344768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,4,balanced,0.057087997595469155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,8,power_law_1.2,0.07095680236816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,4,balanced,0.0584799995024999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,4,balanced,0.10502400000890096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,8,power_law_1.2,0.0832256019115448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,4,balanced,0.060080001751581825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,4,balanced,0.12917332847913107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,8,power_law_1.2,0.09155200123786926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,4,balanced,0.06073066592216492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,4,balanced,0.15825066963831583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,8,power_law_1.2,0.10872960090637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,4,balanced,0.07419200241565704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,4,balanced,0.17068266868591309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,4,balanced,0.07291199763615926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,4,balanced,0.24091732501983643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,4,balanced,0.07690666615962982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,8,power_law_1.2,0.11311359405517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,4,balanced,0.08620267113049825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,4,balanced,0.2949440081914266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,8,power_law_1.2,0.12111999988555908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,4,balanced,0.09995200236638387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,4,balanced,0.4261386791865031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,8,power_law_1.2,0.14398720264434814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,4,balanced,0.11934933066368103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,4,balanced,0.13513599832852682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,4,balanced,0.5202720165252686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,8,power_law_1.2,0.20207359790802001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,4,balanced,0.18631466229756674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,8,power_law_1.2,0.25927679538726806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,4,balanced,0.7779200077056885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,4,balanced,0.23504000902175903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,8,power_law_1.2,0.3423680067062378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,4,balanced,0.3312319914499919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,4,balanced,1.002021312713623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,8,power_law_1.2,0.48209280967712403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,4,balanced,0.39800532658894855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,8,power_law_1.2,0.731059217453003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,4,power_law_1.01,0.05702400207519531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,8,power_law_1.2,0.8925312042236329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,4,balanced,0.5842186609903971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,4,balanced,1.219765345255534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,4,balanced,0.032746667663256325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,4,power_law_1.01,0.06306560039520263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,8,power_law_1.2,1.4114303588867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,4,balanced,0.0322773332397143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,4,power_law_1.01,0.05395200252532959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,4,balanced,0.7514399687449137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,8,power_law_1.2,1.7274368286132813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,4,balanced,0.04491733511288961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,4,power_law_1.01,0.06751999855041504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,4,balanced,0.04810666541258494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,8,power_law_1.2,2.611078453063965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,4,power_law_1.01,0.06837120056152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,4,balanced,1.9570612907409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,4,balanced,0.04927466809749603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,4,power_law_1.01,0.07301759719848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,4,balanced,0.9174239635467529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,8,power_law_1.2,3.437299346923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,4,power_law_1.01,0.08012800216674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,4,balanced,0.04948266843954722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,8,power_law_1.2,4.096160125732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,4,power_law_1.01,0.07796480059623719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,4,balanced,0.050111999114354454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,4,power_law_1.01,0.07790079712867737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,4,balanced,0.04993600149949392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,8,power_law_1.2,6.86968994140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,4,power_law_1.01,0.5108352184295655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,4,balanced,1.4554346402486165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,4,power_law_1.01,0.08900480270385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,8,power_law_1.2,13.680256652832032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,4,power_law_1.01,0.092467200756073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,4,balanced,0.053183997670809426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,4,balanced,3.8394880294799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,4,power_law_1.01,0.09934080243110657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,4,balanced,0.05406400064627329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,4,power_law_1.01,0.11099519729614257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,4,power_law_1.01,0.13646080493927001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,4,power_law_1.01,0.1362239956855774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,4,power_law_1.01,0.13950719833374023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,4,balanced,2.840949376424154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,4,power_law_1.01,0.19427839517593384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,4,balanced,0.05295466880003611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,4,power_law_1.01,0.2740607976913452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,4,balanced,0.05406400064627329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,4,power_law_1.01,0.38699519634246826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,4,power_law_1.01,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,4,balanced,0.05562133093674978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,4,power_law_1.01,0.30971519947052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,4,power_law_1.01,0.04407039880752563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,4,balanced,0.0555626650651296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,4,power_law_1.01,0.04576640129089356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,4,power_law_1.01,0.5230400085449218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,4,power_law_1.01,0.05325440168380737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,4,power_law_1.01,0.6674752235412598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,4,power_law_1.01,0.05326719880104065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,4,power_law_1.01,0.7955647945404053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,4,power_law_1.01,0.05605120062828064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,4,power_law_1.01,1.196735954284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,4,power_law_1.01,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,4,power_law_1.01,1.7037439346313477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,4,balanced,0.0641599992911021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,4,power_law_1.01,0.06111360192298889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,4,power_law_1.01,2.4561344146728517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,4,balanced,0.0652213344971339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,4,power_law_1.01,0.06415359973907471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,4,balanced,0.06750399867693584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,4,power_law_1.01,3.8476734161376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,4,power_law_1.01,0.039878401160240176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,4,balanced,0.08814932902654012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,4,power_law_1.01,0.06410880088806152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,4,power_law_1.01,5.073171234130859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,4,power_law_1.01,0.04053759872913361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,4,balanced,0.09412800272305806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,4,power_law_1.01,0.06681600213050842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,4,power_law_1.01,0.0409855991601944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,4,power_law_1.01,0.047788798809051514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,4,power_law_1.01,0.06941440105438232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,4,power_law_1.01,9.74877471923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,4,power_law_1.01,0.04847359955310822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,4,power_law_1.01,0.07319679856300354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,4,power_law_1.01,0.05126399993896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,4,power_law_1.01,0.058931201696395874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,4,power_law_1.2,0.06213120222091675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,4,balanced,0.12776000301043192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,4,power_law_1.01,0.07614719867706299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,4,power_law_1.01,0.06323199868202209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,4,power_law_1.2,0.06280320286750793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,4,power_law_1.01,0.091430401802063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,4,balanced,0.15635733803113303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,4,power_law_1.01,0.0651968002319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,4,power_law_1.2,0.0599295973777771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,4,power_law_1.01,0.09296640157699584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,4,power_law_1.01,0.06798719763755798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,4,balanced,0.22012799978256226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,4,power_law_1.2,0.06791679859161377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,4,power_law_1.01,0.11371519565582275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,4,balanced,0.27726932366689044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,4,power_law_1.2,0.06875519752502442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,4,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,4,power_law_1.01,0.12888959646224976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,4,power_law_1.2,0.07214080095291138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,4,power_law_1.01,0.06764159798622131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,4,power_law_1.01,0.1802623987197876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,4,power_law_1.2,0.07567999958992004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,4,power_law_1.01,0.07244160175323486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,4,power_law_1.01,0.08589439988136291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,4,power_law_1.2,0.07836800217628478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,4,power_law_1.01,0.19659520387649537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,4,balanced,0.43535999457041424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,4,power_law_1.2,0.22313599586486815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,4,power_law_1.01,0.23495039939880372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,4,power_law_1.01,0.0866815984249115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,4,power_law_1.2,0.7939712047576905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,4,power_law_1.01,0.31152639389038084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,4,power_law_1.01,0.08913919925689698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,4,balanced,0.5777546564737955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,4,power_law_1.2,0.08849279880523682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,4,power_law_1.01,0.11669119596481323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,4,power_law_1.01,0.4366720199584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,4,power_law_1.01,0.1356287956237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,4,power_law_1.2,0.0884223997592926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,4,power_law_1.01,0.6622464179992675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,4,power_law_1.01,0.1847615957260132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,4,power_law_1.2,0.09874560236930847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,4,balanced,0.8639732996622721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,4,power_law_1.01,0.2965951919555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,4,power_law_1.01,0.7938047885894776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,4,power_law_1.2,0.10842880010604858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,4,power_law_1.01,0.3518208026885986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,4,power_law_1.2,0.1333567976951599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,4,power_law_1.01,1.1831295967102051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,4,power_law_1.01,0.5154047966003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,4,balanced,1.146890640258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,4,power_law_1.2,0.12753280401229858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,4,power_law_1.01,0.5998591899871826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,4,power_law_1.01,1.9213312149047852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,4,power_law_1.2,0.1607103943824768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,4,power_law_1.01,2.0392831802368163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,4,power_law_1.01,1.0489407539367677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,4,power_law_1.2,0.1832576036453247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,4,power_law_1.01,1.560102367401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,4,balanced,1.4103412628173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,4,power_law_1.01,2.9839168548583985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,4,power_law_1.2,0.3099136114120483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,4,power_law_1.01,2.3954687118530273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,4,power_law_1.2,0.46586241722106936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,4,power_law_1.01,5.971481704711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,4,power_law_1.01,2.6715072631835937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,4,power_law_1.2,0.5081727981567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,4,power_law_1.01,3.285939025878906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,4,power_law_1.2,0.6985983848571777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,4,power_law_1.01,5.451551818847657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,4,power_law_1.2,0.5751552104949951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,4,balanced,2.2512693405151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,4,power_law_1.01,12.806541442871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,4,power_law_1.2,0.9697792053222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,4,power_law_1.2,1.5322175979614259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,4,power_law_1.2,1.7692096710205079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,4,power_law_1.2,2.9244543075561524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,4,power_law_1.2,3.6144065856933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,4,balanced,4.467263857523601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,4,power_law_1.2,5.4663551330566404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,4,power_law_1.2,12.990170288085938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,4,power_law_1.2,0.05240319967269898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,4,power_law_1.2,0.051052802801132204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,4,power_law_1.2,0.04588800072669983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,4,power_law_1.2,0.04041599929332733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,4,power_law_1.2,0.052960002422332765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,4,power_law_1.2,0.05329279899597168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,4,power_law_1.2,0.043059200048446655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,4,power_law_1.2,0.057555198669433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,4,power_law_1.2,0.043993601202964784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,4,power_law_1.2,0.06063359975814819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,2,balanced,0.04026666780312856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,4,power_law_1.2,0.047865599393844604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,4,power_law_1.2,0.04951040148735046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,4,power_law_1.2,0.06156799793243408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,2,balanced,0.04916800061861674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,4,power_law_1.2,0.06356480121612548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,4,power_law_1.2,0.05448960065841675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,2,balanced,0.06593599915504456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,4,power_law_1.2,0.06650879979133606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,4,power_law_1.2,0.060038399696350095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,2,balanced,0.06934399902820587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,4,power_law_1.2,0.06718080043792725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,2,balanced,0.06901866694291432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,4,power_law_1.2,0.060844802856445314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,4,power_law_1.2,0.06824960112571717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,2,balanced,0.07045333087444305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,4,power_law_1.2,0.07146239876747132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,4,power_law_1.2,0.06649600267410279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,2,balanced,0.07074133555094402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,2,balanced,0.07090133428573608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,4,power_law_1.2,0.06821759939193725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,4,power_law_1.2,0.08252800107002259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,2,balanced,0.07361066838105519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,4,power_law_1.2,0.08850560188293458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,2,balanced,0.0735999991496404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,4,power_law_1.2,0.1043776035308838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,4,power_law_1.2,0.06231679916381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,2,balanced,0.07497600217660268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,4,power_law_1.2,0.11401599645614624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,4,power_law_1.2,0.07425919771194459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,2,balanced,0.07642666498819987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,4,power_law_1.2,0.12739200592041017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,4,power_law_1.2,0.07116159796714783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,2,balanced,0.07717333237330119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,2,balanced,0.03469333300987879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,4,power_law_1.2,0.16652159690856932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,4,power_law_1.2,0.08273280262947083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,2,balanced,0.08536000053087871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,4,power_law_1.2,0.24735360145568847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,2,balanced,0.03699733316898346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,2,balanced,0.08686932921409607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,4,power_law_1.2,0.24729599952697753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,2,balanced,0.049914668003718056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,2,balanced,0.08797333637873332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,4,power_law_1.2,0.37487359046936036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,4,power_law_1.2,0.09685760140419006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,2,balanced,0.05259733398755392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,2,balanced,0.10335466265678406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,4,power_law_1.2,0.427891206741333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,2,balanced,0.0536053329706192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,4,power_law_1.2,0.10213760137557984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,2,balanced,0.10685867071151733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,2,balanced,0.05395199855168661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,4,power_law_1.2,0.12692480087280272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,4,power_law_1.2,0.7647039890289307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,2,balanced,0.11275733510653178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,2,balanced,0.054474666714668274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,4,power_law_1.2,0.8974847793579102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,4,power_law_1.2,0.1751039981842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,2,balanced,0.1677066683769226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,2,balanced,0.054901331663131714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,4,power_law_1.2,1.376582431793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,4,power_law_1.2,0.18773759603500367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,2,balanced,0.1832053263982137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,2,balanced,0.05517866710821787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,4,power_law_1.2,1.8342912673950196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,2,balanced,0.25970667600631714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,4,power_law_1.2,0.3053247928619385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,2,balanced,0.0557226687669754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,4,power_law_1.2,2.1080575942993165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,2,balanced,0.32184000809987384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,4,power_law_1.2,0.46300158500671384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,2,balanced,0.05682666599750519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,4,power_law_1.2,2.895039939880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,2,balanced,0.05760000149408976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,4,power_law_1.2,0.601907205581665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,2,balanced,0.4646186828613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,2,balanced,0.058186665177345276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,4,power_law_1.2,0.8295231819152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,4,power_law_1.2,6.934105682373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,2,balanced,0.5607999960581461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,2,balanced,0.06321600079536438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,4,power_law_1.2,1.148582363128662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,2,balanced,0.06889600058396657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,2,balanced,0.8418400287628174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,4,power_law_1.2,1.8544063568115234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,2,balanced,0.06814399858315785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,2,balanced,0.07483733197053273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,4,power_law_1.2,2.228339195251465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,2,balanced,0.08729066451390584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,2,balanced,1.0980106989542644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,4,power_law_1.2,2.524563217163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,2,balanced,0.09616000453631084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,4,power_law_1.2,4.049299240112305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,2,balanced,0.12463466326395671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,2,balanced,1.3549599647521973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,4,power_law_1.2,6.2591808319091795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,2,balanced,0.14848533272743225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,2,power_law_1.01,0.048390400409698484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,2,balanced,0.2056480050086975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,4,power_law_1.2,11.33531494140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,2,power_law_1.01,0.05252479910850525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,2,balanced,0.2595040003458659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,2,power_law_1.01,0.05936639904975891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,2,balanced,2.127829392751058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,2,power_law_1.01,0.06805760264396668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,2,balanced,0.36717867851257324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,2,power_law_1.01,0.0679423987865448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,2,power_law_1.01,0.07217280268669128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,2,balanced,0.45371735095977783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,2,power_law_1.01,0.03500159978866577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,2,balanced,0.02741866558790207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,2,power_law_1.01,0.07637119889259339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,2,power_law_1.01,0.039129599928855896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,2,power_law_1.01,0.07830399870872498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,2,balanced,0.031471999982992806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,2,balanced,0.6655199925104777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,2,balanced,0.04423466821511587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,2,power_law_1.01,0.040889599919319154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,2,power_law_1.01,0.3598848104476929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,2,balanced,0.047322665651639305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,2,power_law_1.01,0.05139200091361999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,2,balanced,0.04850666721661886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,2,power_law_1.01,0.07894399762153625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,2,balanced,4.127349217732747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,2,balanced,0.049285332361857094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,2,balanced,0.8604746659596761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,2,power_law_1.01,0.050758397579193114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,2,power_law_1.01,0.08849920034408569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,2,balanced,0.049413333336512245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,2,power_law_1.01,0.05322880148887634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,2,balanced,0.049685334165891014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,2,power_law_1.01,0.08919039964675904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,2,power_law_1.01,0.05377920269966126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,2,power_law_1.01,0.09285759925842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,2,balanced,1.054752031962077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,2,power_law_1.01,0.059359997510910034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,2,power_law_1.01,0.10909440517425537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,2,power_law_1.01,0.06037120223045349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,2,power_law_1.01,0.1158336043357849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,2,balanced,0.05051200091838837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,2,power_law_1.01,0.05978879928588867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,2,power_law_1.01,0.11498240232467652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,2,power_law_1.01,0.030246400833129884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,2,balanced,0.05188799897829691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,2,power_law_1.01,0.06219519972801209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,2,power_law_1.01,0.11192959547042847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,2,power_law_1.01,0.033580800890922545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,2,balanced,1.6954186757405598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,2,power_law_1.01,0.06503040194511414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,2,power_law_1.01,0.1572991967201233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,2,power_law_1.01,0.036908799409866334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,2,power_law_1.01,0.06643199920654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,2,power_law_1.01,0.0482367992401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,2,power_law_1.01,0.17329920530319215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,2,power_law_1.01,0.07736319899559022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,2,power_law_1.01,0.04785279929637909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,2,power_law_1.01,0.23345279693603516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,2,power_law_1.01,0.08293120265007019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,2,power_law_1.01,0.052665597200393675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,2,power_law_1.01,0.2715840101242065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,2,power_law_1.01,0.08520320057868958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,2,power_law_1.01,0.05658239722251892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,2,power_law_1.01,0.35479040145874025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,2,power_law_1.01,0.0945472002029419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,2,power_law_1.01,0.42211198806762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,2,power_law_1.01,0.05856000185012818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,2,power_law_1.01,0.1122431993484497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,2,balanced,0.05398933092753092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,2,power_law_1.01,0.6742208003997803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,2,power_law_1.01,0.13343360424041747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,2,balanced,3.2330506642659507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,2,balanced,0.05565866827964783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,2,power_law_1.01,0.7850560188293457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,2,balanced,0.057850668827692665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,2,power_law_1.01,0.164300799369812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,2,power_law_1.01,0.061638402938842776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,2,balanced,0.05902933577696482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,2,power_law_1.01,0.19889919757843016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,2,power_law_1.01,1.4315008163452148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,2,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,2,power_law_1.01,0.28257920742034914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,2,power_law_1.01,1.8439296722412108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,2,power_law_1.01,0.3328831911087036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,2,power_law_1.01,1.9135040283203124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,2,balanced,0.06834666430950165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,2,power_law_1.01,0.06427519917488098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,2,power_law_1.01,0.4834303855895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,2,power_law_1.01,3.161235237121582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,2,balanced,0.06977599859237671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,2,power_law_1.01,0.06714879870414733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,2,power_law_1.01,0.5793600082397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,2,balanced,0.07470933099587758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,2,power_law_1.01,0.07012479901313781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,2,power_law_1.01,6.308012771606445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,2,power_law_1.01,0.8015680313110352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,2,balanced,0.099589337905248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,2,balanced,0.10749866565068562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,2,power_law_1.01,0.07596160173416137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,2,power_law_1.01,1.331283187866211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,2,balanced,0.1462453305721283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,2,power_law_1.01,1.5752063751220704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,2,power_law_1.01,0.08739839792251587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,2,balanced,0.1836693286895752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,2,power_law_1.01,2.6747135162353515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,2,power_law_1.01,0.09410560131072998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,2,balanced,0.2712480028470357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,2,power_law_1.01,0.09867519736289979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,2,balanced,0.3569493293762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,2,power_law_1.01,4.700339126586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,2,power_law_1.01,0.13826559782028197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,2,power_law_1.01,0.14636160135269166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,2,power_law_1.01,0.224236798286438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,2,power_law_1.01,0.2849024057388306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,2,balanced,0.5472906827926636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,2,power_law_1.01,0.40625920295715334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,2,balanced,0.715440034866333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,2,power_law_1.01,0.5822080135345459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,2,balanced,1.0657707055409749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,2,power_law_1.01,0.8500415802001953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,2,power_law_1.01,1.1094143867492676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,2,power_law_1.01,1.3984959602355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,2,balanced,1.4060427347819011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,2,power_law_1.01,1.895680046081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,2,power_law_1.2,0.04276480078697205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,2,power_law_1.01,2.4617984771728514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,2,balanced,1.7394240697224934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,2,power_law_1.2,0.04798080027103424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,2,power_law_1.01,4.405612945556641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,2,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,2,power_law_1.01,8.940230560302734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,2,power_law_1.2,0.06846079826354981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,2,power_law_1.2,0.06759679913520814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,2,balanced,2.769440015157064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,2,power_law_1.2,0.0717631995677948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,2,power_law_1.2,0.03743999898433685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,2,power_law_1.2,0.07317759990692138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,2,power_law_1.2,0.0383103996515274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,2,power_law_1.2,0.07751039862632751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,2,power_law_1.2,0.04168320000171662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,2,power_law_1.2,0.36436479091644286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,2,power_law_1.2,0.05134080052375793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,2,power_law_1.2,0.7933824062347412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,2,power_law_1.2,0.052934402227401735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,2,power_law_1.2,0.08569599986076355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,2,power_law_1.2,0.054745602607727054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,2,power_law_1.2,0.08948479890823365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,2,balanced,5.484426498413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,2,power_law_1.2,0.0572160005569458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,2,power_law_1.2,0.09056640267372132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,2,power_law_1.2,0.058963197469711306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,2,power_law_1.2,0.06035839915275574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,2,power_law_1.2,0.10902400016784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,2,power_law_1.2,0.060787200927734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,2,power_law_1.2,0.11521919965744018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,2,power_law_1.2,0.06537600159645081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,2,power_law_1.2,0.11932159662246704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,2,power_law_1.2,0.06609920263290406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,2,power_law_1.2,0.11943039894104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,2,power_law_1.2,0.06646400094032287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,2,power_law_1.2,0.1569216012954712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,2,power_law_1.2,0.07953919768333435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,2,power_law_1.2,0.08503680229187012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,2,power_law_1.2,0.18006399869918824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,2,power_law_1.2,0.030822399258613586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,2,power_law_1.2,0.08556159734725952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,2,power_law_1.2,0.21281919479370118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,2,power_law_1.2,0.03555200099945068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,2,power_law_1.2,0.09523199796676636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,2,power_law_1.2,0.2652224063873291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,2,power_law_1.2,0.03372159898281098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,2,power_law_1.2,0.04663040041923523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,2,power_law_1.2,0.11498240232467652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,2,power_law_1.2,0.4083456039428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,2,power_law_1.2,0.04837760031223297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,2,power_law_1.2,0.055225598812103274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,2,power_law_1.2,0.1249343991279602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,2,power_law_1.2,0.44705920219421386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,2,power_law_1.2,0.05768960118293762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,2,power_law_1.2,0.1800320029258728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,2,power_law_1.2,0.6367680072784424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,2,power_law_1.2,0.056627202033996585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,2,power_law_1.2,0.22584960460662842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,2,power_law_1.2,0.9163071632385253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,2,power_law_1.2,0.2599551916122437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,2,power_law_1.2,0.059411197900772095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,2,power_law_1.2,1.3385343551635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,2,power_law_1.2,0.34085760116577146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,2,power_law_1.2,0.06177279949188232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,2,power_law_1.2,1.967398452758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,2,power_law_1.2,0.5242368221282959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,2,power_law_1.2,0.6764800071716308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,2,power_law_1.2,2.530086326599121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,2,power_law_1.2,0.06575999855995178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,2,power_law_1.2,1.0144448280334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,2,power_law_1.2,0.06885120272636414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,2,power_law_1.2,3.441740798950195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,1,balanced,0.03950933367013931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,2,power_law_1.2,0.06988160014152527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,2,power_law_1.2,1.2237631797790527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,2,power_law_1.2,0.0725055992603302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,2,power_law_1.2,7.401152038574219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,1,balanced,0.04854933420817057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,2,power_law_1.2,1.7791807174682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,1,balanced,0.06247466802597046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,2,power_law_1.2,0.08698239922523499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,2,power_law_1.2,2.7582719802856444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,1,balanced,0.0686773310105006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,2,power_law_1.2,0.09196159839630128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,2,power_law_1.2,0.09864320158958435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,2,power_law_1.2,5.139801788330078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,1,balanced,0.06564799944559734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,2,power_law_1.2,0.1363584041595459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,1,balanced,0.06715199848016103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,2,power_law_1.2,0.16663039922714235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,1,balanced,0.0674186646938324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,1,balanced,0.03485333422819773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,2,power_law_1.2,0.23503360748291016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,2,power_law_1.2,0.30574080944061277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,1,balanced,0.07146133482456207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,1,balanced,0.03625600039958954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,2,power_law_1.2,0.4013951778411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,1,balanced,0.07427200178305308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,2,power_law_1.2,0.5638463973999024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,1,balanced,0.05065600077311198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,1,balanced,0.07442666590213776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,1,balanced,0.05349333087603251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,2,power_law_1.2,0.8552191734313965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,1,balanced,0.07559999823570251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,2,power_law_1.2,1.1830528259277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,1,balanced,0.05470933516820272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,2,power_law_1.2,1.7684928894042968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,1,balanced,0.07891199986139934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,1,balanced,0.05552533268928528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,2,power_law_1.2,2.096044731140137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,1,balanced,0.07913066446781158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,1,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,2,power_law_1.2,2.8997631072998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,1,balanced,0.08400533596674602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,1,balanced,0.05598933498064677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,2,power_law_1.2,4.596076965332031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,1,balanced,0.09115200241406758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,1,balanced,0.05669866502285004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,2,power_law_1.2,8.992198181152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,1,balanced,0.09178666273752849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,1,balanced,0.0576800008614858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,1,balanced,0.10346133510271709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,1,balanced,0.058965335289637245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,1,balanced,0.12784000237782797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,1,balanced,0.060959999759991966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,1,balanced,0.06214933097362518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,1,balanced,0.12833600242932638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,1,balanced,0.06693333387374878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,1,balanced,0.1700800061225891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,1,balanced,0.07351466516653697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,1,balanced,0.20084265867869058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,1,balanced,0.028005334238211315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,1,balanced,0.07302399973074596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,1,balanced,0.03067733347415924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,1,balanced,0.2842400074005127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,1,balanced,0.08331199983755748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,1,balanced,0.045461331804593406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,1,balanced,0.3660800059636434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,1,balanced,0.10738666852315266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,1,balanced,0.049029335379600525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,1,balanced,0.11379200220108032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,1,balanced,0.05039466420809428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,1,balanced,0.5304746627807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,1,balanced,0.05102399984995524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,1,balanced,0.1476959983507792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,1,balanced,0.6635200182596842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,1,balanced,0.052298665046691895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,1,power_law_1.01,0.039654400944709775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,1,balanced,0.17230399449666342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,1,balanced,0.05264533559481303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,1,power_law_1.01,0.04619520008563995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,1,balanced,0.9957119623819987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,1,balanced,0.24444266160329184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,1,power_law_1.01,0.04624640047550201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,1,balanced,0.3144853313763936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,1,power_law_1.01,0.06664320230484008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,1,balanced,1.2820213635762532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,1,power_law_1.01,0.06470400094985962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,1,balanced,0.05444799860318502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,1,balanced,0.4610133171081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,1,power_law_1.01,0.06626560091972351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,1,balanced,0.056474665800730385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,1,balanced,0.5793173313140869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,1,power_law_1.01,0.0723136007785797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,1,power_law_1.01,0.03506560027599335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,1,balanced,1.560698668162028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,1,power_law_1.01,0.07711359858512878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,1,power_law_1.01,0.03594239950180054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,1,balanced,0.8547413349151611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,1,power_law_1.01,0.7755072116851807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,1,power_law_1.01,0.037567999958992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,1,power_law_1.01,0.35916800498962403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,1,power_law_1.01,0.052300798892974856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,1,power_law_1.01,0.0782975971698761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,1,power_law_1.01,0.053395199775695804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,1,balanced,2.4709386825561523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,1,balanced,1.093274672826131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,1,balanced,0.059674665331840515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,1,power_law_1.01,0.053881597518920896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,1,power_law_1.01,0.08781440258026123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,1,balanced,0.06285333136717479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,1,power_law_1.01,0.05885440111160278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,1,power_law_1.01,0.09044479727745056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,1,balanced,0.06459733347098033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,1,power_law_1.01,0.10273280143737792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,1,power_law_1.01,0.05883520245552063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,1,balanced,1.3456053733825684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,1,balanced,0.06754133105278015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,1,power_law_1.01,0.11434240341186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,1,power_law_1.01,0.06149119734764099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,1,power_law_1.01,0.11980799436569214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,1,power_law_1.01,0.061478400230407716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,1,power_law_1.01,0.11424640417099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,1,power_law_1.01,0.06262400150299072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,1,power_law_1.01,0.15813119411468507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,1,balanced,4.885973294576009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,1,power_law_1.01,0.0659712016582489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,1,balanced,2.187653382619222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,1,balanced,0.07997333506743114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,1,power_law_1.01,0.16147840023040771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,1,power_law_1.01,0.06738560199737549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,1,balanced,0.08335999647776286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,1,power_law_1.01,0.1962048053741455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,1,power_law_1.01,0.07694079875946044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,1,balanced,0.09076799949010213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,1,power_law_1.01,0.0884223997592926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,1,power_law_1.01,0.21761279106140136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,1,balanced,0.12559466560681662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,1,power_law_1.01,0.08967040181159973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,1,power_law_1.01,0.29663360118865967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,1,balanced,0.13922133048375449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,1,power_law_1.01,0.09103999733924865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,1,power_law_1.01,0.37118079662323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,1,balanced,0.1997493306795756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,1,power_law_1.01,0.11110399961471558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,1,power_law_1.01,0.5324607849121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,1,balanced,4.14302921295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,1,balanced,0.2731626629829407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,1,power_law_1.01,0.1284608006477356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,1,power_law_1.01,0.6805759906768799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,1,power_law_1.01,0.16672639846801757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,1,power_law_1.01,1.0133824348449707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,1,balanced,0.3984053134918213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,1,power_law_1.01,0.18529920578002929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,1,power_law_1.01,1.3117952346801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,1,balanced,0.5138453245162964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,1,power_law_1.01,0.25144960880279543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,1,power_law_1.01,1.6386688232421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,1,power_law_1.01,0.029241600632667543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,1,power_law_1.01,0.31685121059417726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,1,power_law_1.01,2.468614387512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,1,power_law_1.01,0.031123200058937074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,1,power_law_1.01,0.45548157691955565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,1,power_law_1.01,4.817139053344727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,1,power_law_1.01,0.0322816014289856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,1,power_law_1.01,0.5757823944091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,1,balanced,0.772757371266683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,1,power_law_1.01,0.04829440116882324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,1,power_law_1.01,0.8387904167175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,1,power_law_1.2,0.03934719860553741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,1,balanced,1.0109386444091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,1,power_law_1.01,0.04930559992790222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,1,power_law_1.01,1.1043968200683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,1,power_law_1.2,0.04477440118789673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,1,power_law_1.01,0.05089920163154602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,1,power_law_1.01,1.397811222076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,1,power_law_1.2,0.04754559993743897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,1,power_law_1.01,0.057011198997497556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,1,balanced,1.4984052975972493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,1,power_law_1.2,0.06687359809875489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,1,power_law_1.01,2.215590476989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,1,power_law_1.01,0.058169597387313844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,1,power_law_1.2,0.0638592004776001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,1,power_law_1.01,4.123961639404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,1,power_law_1.2,0.06722559928894042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,1,balanced,1.987770716349284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,1,power_law_1.2,0.07263360023498536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,1,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,1,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,1,power_law_1.2,0.07739520072937012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,1,power_law_1.01,0.0642624020576477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,1,power_law_1.2,0.036627200245857236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,1,power_law_1.2,0.21960320472717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,1,balanced,2.468730608622233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,1,power_law_1.2,0.04059520065784454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,1,power_law_1.2,0.5016255855560303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,1,power_law_1.2,0.05220479965209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,1,power_law_1.2,0.08225280046463013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,1,power_law_1.01,0.06809599995613098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,1,power_law_1.2,0.05379840135574341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,1,power_law_1.2,0.0889792025089264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,1,power_law_1.01,0.07043200135231018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,1,power_law_1.2,0.05419520139694214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,1,balanced,3.951173464457194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,1,power_law_1.2,0.08942080140113831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,1,power_law_1.01,0.07182719707489013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,1,power_law_1.2,0.060153597593307497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,1,power_law_1.2,0.10378880500793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,1,power_law_1.01,0.07645440101623535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,1,power_law_1.2,0.05944960117340088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,1,power_law_1.2,0.11815040111541748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,1,power_law_1.2,0.060057598352432254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,1,power_law_1.01,0.09367679953575134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,1,power_law_1.2,0.11639039516448975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,1,power_law_1.2,0.06092159748077393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,1,power_law_1.2,0.11416959762573242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,1,power_law_1.2,0.06216959953308106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,1,power_law_1.01,0.09423999786376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,1,power_law_1.2,0.1400320053100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,1,power_law_1.2,0.06558079719543457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,1,power_law_1.01,0.10497920513153076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,1,balanced,7.834890365600586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,1,power_law_1.2,0.06800640225410462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,1,power_law_1.2,0.1611456036567688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,1,power_law_1.01,0.13338880538940429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,1,power_law_1.2,0.07711359858512878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,1,power_law_1.2,0.20161919593811034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.01,0.15854719877243043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,1,power_law_1.2,0.08861439824104309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,1,power_law_1.2,0.2227328062057495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.01,0.22080640792846679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,1,power_law_1.2,0.09037439823150635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,1,power_law_1.2,0.29592959880828856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.01,0.292409610748291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,1,power_law_1.2,0.0910975992679596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,1,power_law_1.2,0.3889024019241333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.01,0.41663360595703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,1,power_law_1.2,0.11872639656066894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,1,power_law_1.2,0.5355455875396729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.01,0.5272192001342774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,1,power_law_1.2,0.1296447992324829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,1,power_law_1.2,0.6855616092681884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.01,0.790118408203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,1,power_law_1.2,0.16651519536972045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,1,power_law_1.2,1.019200038909912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.01,1.0117568016052245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,1,power_law_1.2,0.1811776041984558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,1,power_law_1.2,1.3228863716125487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.01,1.498969554901123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,1,power_law_1.2,0.2512448072433472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,1,power_law_1.2,1.6708799362182618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,1,power_law_1.2,0.32088959217071533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.01,1.9868288040161133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,1,power_law_1.2,2.4807807922363283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,1,power_law_1.2,0.4550911903381348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,1,power_law_1.01,2.4738496780395507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,1,power_law_1.2,4.827091217041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,1,power_law_1.2,0.5712895870208741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,1,power_law_1.01,3.915270233154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,1,power_law_1.2,0.8394816398620606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,1,power_law_1.2,1.1194687843322755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,1,power_law_1.01,7.820735931396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,1,power_law_1.2,1.4098752021789551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,1,power_law_1.2,2.2235200881958006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,1,power_law_1.2,4.1257984161376955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,1,power_law_1.2,0.028857600688934327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,1,power_law_1.2,0.030579200387001036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,1,power_law_1.2,0.03287039995193482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,1,power_law_1.2,0.04831359982490539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,1,power_law_1.2,0.04927360117435455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,1,power_law_1.2,0.051283198595047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,1,power_law_1.2,0.05726720094680786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,8,balanced,0.10607999563217163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,1,power_law_1.2,0.05751680135726929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,8,balanced,0.1006666620572408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,8,balanced,0.10003200173377991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,1,power_law_1.2,0.06079360246658325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,8,balanced,0.10083733002344768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,1,power_law_1.2,0.06341760158538819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,8,balanced,0.09930666287740071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,8,balanced,0.10121599833170573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,1,power_law_1.2,0.06794880032539367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,8,balanced,0.10109333197275798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,1,power_law_1.2,0.07009279727935791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,8,balanced,0.10473600029945374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,1,power_law_1.2,0.07118719816207886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,8,balanced,0.07240533332029979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,8,balanced,0.10661866267522176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,1,power_law_1.2,0.0762880027294159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,8,balanced,0.07002666592597961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,8,balanced,0.10485866665840149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,1,power_law_1.2,0.09058560132980346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,8,balanced,0.06925866504510243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,8,balanced,0.11534933249155681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,1,power_law_1.2,0.09405440092086792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,8,balanced,0.0713919997215271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,1,power_law_1.2,0.10492160320281982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,8,balanced,0.11170666416486104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,1,power_law_1.2,0.1307968020439148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,8,balanced,0.07277866701285045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.2,0.15758719444274902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,8,balanced,0.111135999361674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,8,balanced,0.07231466472148895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.2,0.21700479984283447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,8,balanced,0.07329066594441731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,8,balanced,0.12005333105723064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.2,0.2919552087783813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,8,balanced,0.1359946628411611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,8,balanced,0.07438399891058604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.2,0.4147456169128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.2,0.5284480094909668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,8,balanced,0.1358506679534912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,8,balanced,0.07426133255163829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,8,balanced,0.13482133547465006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,8,balanced,0.0751146674156189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.2,0.7868927955627442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,8,balanced,0.07879999776681264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.2,1.011955165863037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,8,balanced,0.16820800304412842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.2,1.5011967658996581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,8,balanced,0.07589333256085713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,8,balanced,0.1520693302154541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.2,1.992838478088379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,8,balanced,0.07663466533025105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,1,power_law_1.2,2.471539115905762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,8,balanced,0.33294399579366046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,8,balanced,0.0668213317791621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,1,power_law_1.2,3.9314369201660155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,8,balanced,0.0792746643225352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,8,balanced,0.24558399120966592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,8,balanced,0.06272533535957336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,1,power_law_1.2,7.797792053222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,8,balanced,0.09576533238093059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,8,balanced,0.06301333506902058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,8,balanced,0.3947840134302775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,8,balanced,0.0974666674931844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,8,balanced,0.06592000027497609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,8,balanced,0.4545919895172119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,8,balanced,0.06694933275381725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,8,balanced,0.09654933214187622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,8,balanced,0.06703466673692067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,8,balanced,0.666810671488444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,8,balanced,0.11798399686813354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,8,balanced,0.06772266825040181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,8,balanced,0.12144000331560771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,8,balanced,0.7938186327616373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,8,balanced,0.06730666756629944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,8,power_law_1.01,0.10398080348968505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,8,balanced,0.17896000544230142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,8,power_law_1.01,0.09565439820289612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,8,balanced,0.17981332540512085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,8,balanced,1.2137866814931233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,8,power_law_1.01,0.09611520171165466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,8,balanced,0.07092266778151195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,8,balanced,0.27405333518981934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,8,power_law_1.01,0.09697920083999634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,8,balanced,0.07257066667079926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,8,balanced,1.546336015065511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,8,power_law_1.01,0.09770879745483399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,8,balanced,0.32359466950098675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,8,power_law_1.01,0.10559999942779541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,8,balanced,0.46407465140024823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,8,power_law_1.01,0.11441919803619385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,8,power_law_1.01,0.11690239906311035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,8,balanced,1.964469273885091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,8,power_law_1.01,0.34321279525756837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,8,balanced,0.5660320123036703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,8,power_law_1.01,0.7986688137054443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,8,balanced,0.07234133283297221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,8,power_law_1.01,1.2737664222717284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,8,balanced,0.07363200187683105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,8,balanced,0.8469546635945638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,8,power_law_1.01,1.2908479690551757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,8,balanced,0.07518399755160014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,8,balanced,3.059376080830892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,8,power_law_1.01,1.3165120124816894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,8,balanced,0.0749120016892751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,8,power_law_1.01,0.17523200511932374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,8,balanced,1.090773344039917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,8,power_law_1.01,0.21987199783325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,8,power_law_1.01,0.07159680128097534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,8,power_law_1.01,0.2459968090057373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,8,power_law_1.01,0.06893439888954163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,8,power_law_1.01,0.312825608253479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,8,balanced,1.3690826098124187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,8,power_law_1.01,0.06888319849967957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,8,power_law_1.01,0.5137919902801513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,8,balanced,0.0844106674194336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,8,power_law_1.01,0.06513280272483826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,8,power_law_1.01,0.07109119892120361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,8,power_law_1.01,0.47930240631103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,8,balanced,6.112010955810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,8,balanced,0.08700799942016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,8,power_law_1.01,0.07004799842834472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,8,power_law_1.01,0.647814416885376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,8,power_law_1.01,0.06144639849662781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,8,power_law_1.01,0.0803391993045807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,8,balanced,0.08841066559155782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,8,power_law_1.2,0.10408320426940917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,8,power_law_1.01,0.7197375774383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,8,power_law_1.01,0.06240000128746033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,8,balanced,2.1399787267049155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,8,power_law_1.01,0.08076159954071045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,8,power_law_1.01,1.1253696441650392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,8,power_law_1.2,0.09943680167198181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,8,power_law_1.01,0.06509439945220948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,8,power_law_1.01,0.07712000012397766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,8,power_law_1.01,1.288742446899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,8,power_law_1.2,0.09939839839935302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,8,power_law_1.01,0.06600959897041321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,8,power_law_1.01,0.08324480056762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,8,balanced,0.11357333262761433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,8,power_law_1.01,2.029657554626465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,8,power_law_1.2,0.09912319779396057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,8,power_law_1.01,0.07601919770240784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,8,power_law_1.01,0.09130240082740784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,8,power_law_1.2,0.09883520007133484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,8,balanced,0.11902399857838948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,8,power_law_1.01,0.09459199905395507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,8,power_law_1.01,2.7364479064941407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,8,power_law_1.01,0.08511999845504761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,8,power_law_1.2,0.10794880390167236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,8,power_law_1.01,0.09997439980506898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,8,power_law_1.01,0.09271039962768554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,8,power_law_1.01,4.331718444824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,8,power_law_1.2,0.12511999607086183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,8,power_law_1.01,0.10613759756088256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,8,power_law_1.01,6.087705612182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,8,power_law_1.01,0.09947519898414611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,8,power_law_1.2,0.11670399904251098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,8,balanced,0.1637279987335205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,8,power_law_1.01,0.12936320304870605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,8,balanced,4.1938934326171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,8,power_law_1.2,0.8048383712768554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,8,power_law_1.01,0.11283199787139893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,8,power_law_1.01,7.665376281738281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,8,power_law_1.01,0.15374720096588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,8,balanced,0.202239990234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,8,power_law_1.2,1.0315648078918458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,8,power_law_1.01,0.18306560516357423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,8,power_law_1.01,12.839704895019532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,8,balanced,0.2927093307177226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,8,power_law_1.01,0.20675199031829833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,8,power_law_1.2,1.2616064071655273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,8,power_law_1.01,0.09559680223464966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,8,power_law_1.01,0.26476800441741943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,8,power_law_1.2,1.284774398803711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,8,balanced,0.34939201672871906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,8,power_law_1.01,0.11635839939117432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,8,power_law_1.01,0.2787264108657837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,8,power_law_1.01,24.937901306152344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,8,power_law_1.2,1.322982406616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,8,power_law_1.01,0.11636480093002319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,8,power_law_1.01,0.4378367900848389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,8,power_law_1.2,0.1846783995628357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,8,power_law_1.01,0.1472767949104309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,8,power_law_1.01,0.47045121192932127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,8,power_law_1.2,0.2493311882019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,8,power_law_1.01,0.6807424068450928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,8,power_law_1.2,0.2339008092880249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,8,power_law_1.01,0.7639488220214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,8,balanced,0.5350026686986288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,8,power_law_1.01,0.14180480241775512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,8,power_law_1.2,0.3159424066543579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,8,power_law_1.01,1.332153606414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,8,power_law_1.01,0.15047680139541625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,8,power_law_1.2,0.5114943981170654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,8,power_law_1.01,1.7778175354003907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,8,balanced,0.6993172963460287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,8,power_law_1.01,0.19943039417266845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,8,power_law_1.2,0.4773568153381348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,8,power_law_1.01,2.693414306640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,8,power_law_1.2,0.666860818862915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,8,power_law_1.01,0.27721600532531737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,8,power_law_1.01,3.3363712310791014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,8,balanced,1.0457066694895427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,8,power_law_1.2,0.7788479804992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,8,power_law_1.01,0.31141760349273684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,8,power_law_1.01,4.207462310791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,8,power_law_1.2,1.0253439903259278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,8,power_law_1.01,7.083897399902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,8,power_law_1.01,0.5074751853942872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,8,balanced,1.380282719930013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,8,power_law_1.2,1.4603584289550782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,8,power_law_1.01,0.6682432174682618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,8,power_law_1.2,2.096928024291992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,8,power_law_1.01,14.307058715820313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,8,power_law_1.01,1.055072021484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,8,power_law_1.2,2.7643711090087892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,8,balanced,1.6952160199483235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,8,power_law_1.2,0.07137280106544494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,8,power_law_1.01,1.307583999633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,8,power_law_1.2,4.4844928741455075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,8,power_law_1.2,0.06918399930000305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,8,power_law_1.2,6.219673538208008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,8,power_law_1.2,0.06870399713516236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,8,power_law_1.01,1.8003200531005858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,8,power_law_1.2,0.07088000178337098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,8,power_law_1.2,7.539212799072265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,8,power_law_1.01,2.5855552673339846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,8,balanced,2.7005440394083657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,8,power_law_1.2,0.07050880193710327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,8,power_law_1.01,3.220332717895508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,8,power_law_1.2,0.08035200238227844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,8,power_law_1.2,11.77795181274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,8,power_law_1.2,0.08408960103988647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,8,power_law_1.01,4.916287994384765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,8,power_law_1.2,0.07713279724121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,8,power_law_1.01,6.354361724853516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,8,power_law_1.2,0.08034560084342957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,8,power_law_1.2,25.062086486816405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,8,power_law_1.2,0.08387200236320495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,8,power_law_1.01,9.409375762939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,8,power_law_1.2,0.08715519905090333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,8,balanced,5.307589213053386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,8,power_law_1.2,0.10119680166244507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,8,power_law_1.01,20.19000244140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,8,power_law_1.2,0.09859840273857116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,8,power_law_1.2,0.12239359617233277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,8,power_law_1.2,0.16750719547271728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,8,power_law_1.2,0.1660223960876465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,8,power_law_1.2,0.17927680015563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,8,power_law_1.2,0.26226561069488524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,8,power_law_1.2,0.31672959327697753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,8,power_law_1.2,0.4601920127868652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,8,power_law_1.2,0.47093758583068845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,8,power_law_1.2,0.7079103946685791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,8,power_law_1.2,0.8729151725769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,8,power_law_1.2,1.3396160125732421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,8,power_law_1.2,1.7741119384765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,8,power_law_1.2,2.463692855834961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,8,power_law_1.2,3.3069759368896485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,8,power_law_1.2,4.35456657409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,8,power_law_1.2,0.0651968002319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,8,power_law_1.2,6.715142059326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,8,power_law_1.2,0.06206079721450806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,8,power_law_1.2,13.828384399414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,8,power_law_1.2,0.06228479743003845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,8,power_law_1.2,0.06528639793395996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,8,power_law_1.2,0.06599680185317994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,4,balanced,0.07354666789372762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,8,power_law_1.2,0.07916799783706666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,4,balanced,0.07044800122578938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,8,power_law_1.2,0.08960000276565552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,4,balanced,0.09643733501434326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,8,power_law_1.2,0.10505599975585937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,4,balanced,0.09934399525324504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,4,balanced,0.09878933429718018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,8,power_law_1.2,0.10234240293502808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,4,balanced,0.09959466258684795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,4,balanced,0.05097066859404246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,8,power_law_1.2,0.1133952021598816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,4,balanced,0.10178132851918538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,4,balanced,0.04937600096066793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,4,balanced,0.10051199793815613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,4,balanced,0.06569600105285645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,8,power_law_1.2,0.09513599872589111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,4,balanced,0.06808533271153767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,4,balanced,0.10377066334088643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,8,power_law_1.2,0.12103040218353271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,4,balanced,0.06993600229422252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,4,balanced,0.10485866665840149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,8,power_law_1.2,0.11879680156707764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,4,balanced,0.07022933165232341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,4,balanced,0.1090719997882843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,8,power_law_1.2,0.1423807978630066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,4,balanced,0.07046933472156525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,4,balanced,0.10739733775456746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,4,balanced,0.07123733560244243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,4,balanced,0.10789866248766582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,8,power_law_1.2,0.15137920379638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,4,balanced,0.07137066622575124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,4,balanced,0.1132533351580302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,4,balanced,0.07197333375612895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,4,balanced,0.13038399815559387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,8,power_law_1.2,0.162009596824646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,4,balanced,0.13209600249926248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,4,balanced,0.07343466579914093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,8,power_law_1.2,0.20841600894927978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,4,balanced,0.13725333412488303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,4,balanced,0.07392000158627827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,4,balanced,0.15922133127848306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,8,power_law_1.2,0.248089599609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,4,balanced,0.07577066620190938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,4,balanced,0.1530133287111918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,8,power_law_1.2,0.3364799976348877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,4,balanced,0.07986133297284444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,4,balanced,0.25942933559417725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,4,balanced,0.09243200222651164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,8,power_law_1.2,0.5602880001068116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,4,balanced,0.2600959936777751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,4,balanced,0.09311999877293904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,8,power_law_1.2,0.611027193069458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,4,balanced,0.3651680151621501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,4,balanced,0.09874666730562846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,8,power_law_1.2,1.1098048210144043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,4,balanced,0.11312533418337505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,4,balanced,0.43565332889556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,8,power_law_1.2,1.308396816253662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,4,balanced,0.11752532919247945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,4,balanced,0.044810667634010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,4,balanced,0.6499786774317423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,8,power_law_1.2,1.8471040725708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,4,balanced,0.18157867590586343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,4,balanced,0.0430026650428772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,8,power_law_1.2,2.4903743743896483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,4,balanced,0.8226026693979899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,4,balanced,0.19139200448989868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,4,balanced,0.06062933305899302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,8,power_law_1.2,3.8107200622558595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,4,balanced,0.06311466793219249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,4,balanced,0.26707732677459717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,4,balanced,0.06468266745408376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,4,balanced,1.223413308461507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,8,power_law_1.2,4.9350017547607425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,4,balanced,0.32518933216730755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,4,balanced,0.06497066716353099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,4,balanced,0.06547733147939046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,8,power_law_1.2,6.35346565246582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,4,balanced,0.4700426657994588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,4,balanced,1.604453404744466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,4,balanced,0.06579199930032094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,4,power_law_1.01,0.10090880393981934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,8,power_law_1.2,10.123027038574218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,4,power_law_1.01,0.08762239813804626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,4,balanced,0.5952693223953247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,4,power_law_1.01,0.06678400039672852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,4,power_law_1.01,0.08413439989089966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,4,balanced,1.9981226921081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,8,power_law_1.2,19.38385925292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,4,power_law_1.01,0.09792640209197997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,4,power_law_1.01,0.054527997970581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,4,balanced,0.86899733543396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,4,balanced,0.06659199794133504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,4,power_law_1.01,0.05839999914169312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,4,power_law_1.01,0.09811840057373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,4,power_law_1.01,0.06817920207977295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,4,power_law_1.01,0.11008640527725219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,4,power_law_1.01,0.05235840082168579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,4,balanced,0.06713599960009257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,4,power_law_1.01,0.06902400255203248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,4,power_law_1.01,0.11178879737854004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,4,power_law_1.01,0.07081599831581116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,4,power_law_1.01,0.05688959956169128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,4,balanced,1.151477336883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,4,power_law_1.01,0.07705600261688232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,4,balanced,3.158752123514811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,4,power_law_1.01,0.11560959815979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,4,power_law_1.01,0.07939199805259704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,4,power_law_1.01,0.053491199016571046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,4,power_law_1.01,0.08081279993057251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,4,power_law_1.01,0.5433472156524658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,4,power_law_1.01,0.06387839913368225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,4,power_law_1.01,0.08150399923324585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,4,power_law_1.01,0.08387839794158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,4,power_law_1.01,0.5443583965301514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,4,power_law_1.01,0.06338559985160827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,4,balanced,1.4401226043701172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,4,power_law_1.01,0.09229440093040467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,4,power_law_1.01,0.13755520582199096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,4,power_law_1.01,0.07277439832687378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,4,power_law_1.01,0.09247360229492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,4,balanced,0.06986133257548015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,4,power_law_1.01,0.11386879682540893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,4,power_law_1.01,0.1400383949279785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,4,power_law_1.01,0.081004798412323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,4,balanced,0.07132799923419952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,4,power_law_1.01,0.1312384009361267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,4,power_law_1.01,0.08652799725532531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,4,power_law_1.01,0.13865599632263184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,4,power_law_1.01,0.14141440391540527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,4,balanced,0.07380799949169159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,4,power_law_1.01,0.1350335955619812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,4,balanced,2.2446187337239585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,4,power_law_1.01,0.16717439889907837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,4,power_law_1.01,0.18535679578781128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,4,balanced,6.2292054494222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,4,balanced,0.0745600014925003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,4,power_law_1.01,0.18856960535049438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,4,power_law_1.01,0.23390719890594483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,4,power_law_1.01,0.09144319891929627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,4,power_law_1.01,0.2890944004058838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,4,power_law_1.01,0.24236159324645995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,4,power_law_1.01,0.3757888078689575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,4,power_law_1.01,0.09125760197639465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,4,power_law_1.01,0.21789441108703614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,4,power_law_1.01,0.5071743965148926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,4,power_law_1.01,0.6497727870941162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,4,balanced,0.08357866605122884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,4,power_law_1.01,0.3041663885116577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,4,power_law_1.01,0.9981887817382813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,4,power_law_1.01,0.325817608833313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,4,power_law_1.01,0.0852288007736206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,4,power_law_1.01,1.2334464073181153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,4,balanced,0.08558400472005208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,4,power_law_1.01,0.41826558113098145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,4,power_law_1.01,1.8863040924072265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,4,power_law_1.01,0.08757759928703308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,4,balanced,0.08943999807039897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,4,power_law_1.01,2.4545215606689452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,4,power_law_1.01,0.5353919982910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,4,balanced,4.38694413503011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,4,power_law_1.01,0.09637759923934937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,4,power_law_1.2,0.10819200277328492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,4,balanced,0.1192586620648702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,4,power_law_1.01,3.2913856506347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,4,power_law_1.01,0.8047807693481446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,4,power_law_1.01,0.11937919855117798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,4,power_law_1.01,3.9198463439941404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,4,balanced,0.12863999605178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,4,power_law_1.2,0.08265600204467774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,4,power_law_1.01,1.0814399719238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,4,power_law_1.2,0.09479680061340331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,4,balanced,0.17513600985209146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,4,power_law_1.01,8.674163055419921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,4,power_law_1.01,0.11886080503463745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,4,power_law_1.01,1.4181376457214356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,4,power_law_1.2,0.09781759977340698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,4,balanced,0.21472533543904623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,4,power_law_1.01,0.1393728017807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,4,power_law_1.2,0.09830399751663207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,4,power_law_1.01,2.3593471527099608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,4,power_law_1.01,0.16955519914627076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,4,power_law_1.2,0.10973440408706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,4,power_law_1.01,3.619807815551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,4,power_law_1.01,0.1975808024406433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,4,power_law_1.2,0.1144063949584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,4,power_law_1.01,4.073600006103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,4,power_law_1.01,0.2712064027786255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,4,power_law_1.2,0.11685760021209717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,4,balanced,0.32147733370463055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,4,power_law_1.01,0.43123202323913573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,4,power_law_1.01,4.949241638183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,4,power_law_1.2,0.5395008087158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,4,balanced,0.41387200355529785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,4,power_law_1.01,0.5697792053222657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,4,power_law_1.2,0.9640383720397949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,4,power_law_1.01,7.957734680175781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,4,power_law_1.2,0.13699840307235717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,4,balanced,0.6570080121358236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,4,power_law_1.01,0.7220992088317871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,4,power_law_1.2,0.14625920057296754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,4,power_law_1.01,19.216018676757812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,4,balanced,0.8668853441874186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,4,power_law_1.2,0.1493888020515442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,4,power_law_1.01,1.0791872024536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,4,power_law_1.01,1.531942367553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,4,power_law_1.2,0.17547520399093627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,4,balanced,1.280138651529948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,4,power_law_1.01,2.3994367599487303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,4,power_law_1.2,0.22423040866851807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,4,power_law_1.2,0.20032000541687012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,4,power_law_1.01,3.8051521301269533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,4,balanced,1.7084159851074219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,4,power_law_1.2,0.22156159877777098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,4,power_law_1.01,4.409785461425781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,4,power_law_1.2,0.2599616050720215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,4,power_law_1.01,5.793132781982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,4,power_law_1.2,0.3211008071899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,4,balanced,2.122591972351074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,4,power_law_1.2,0.4445504188537598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,4,power_law_1.01,9.428173065185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,4,power_law_1.2,0.5940608024597168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,4,power_law_1.01,17.37986602783203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,4,power_law_1.2,0.8918592453002929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,4,balanced,3.403663953145345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,4,power_law_1.2,1.3519295692443847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,4,power_law_1.2,1.6733888626098632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,4,power_law_1.2,2.291084861755371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,4,power_law_1.2,3.4436672210693358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,4,power_law_1.2,4.525299072265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,4,power_law_1.2,5.122873687744141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,4,balanced,6.804010391235352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,4,power_law_1.2,9.110585784912109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,4,power_law_1.2,16.133241271972658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,4,power_law_1.2,0.06284800171852112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,4,power_law_1.2,0.06095359921455383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,4,power_law_1.2,0.058412802219390866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,4,power_law_1.2,0.06795520186424256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,4,power_law_1.2,0.06863999962806702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,4,power_law_1.2,0.0689791977405548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,4,power_law_1.2,0.07612159848213196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,4,power_law_1.2,0.07992320060729981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,4,power_law_1.2,0.08356480002403259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,4,power_law_1.2,0.08840960264205933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,4,power_law_1.2,0.08831999897956848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,4,power_law_1.2,0.08951039910316468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,4,power_law_1.2,0.06040319800376892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,4,power_law_1.2,0.0934719979763031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,4,power_law_1.2,0.056601601839065555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,4,power_law_1.2,0.11643520593643189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,2,balanced,0.050213331977526345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,4,power_law_1.2,0.053376001119613645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,4,power_law_1.2,0.06312320232391358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,4,power_law_1.2,0.1304128050804138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,2,balanced,0.06468266745408376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,2,balanced,0.03726933399836222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,4,power_law_1.2,0.0641152024269104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,4,power_law_1.2,0.07884160280227662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,4,power_law_1.2,0.14079359769821168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,2,balanced,0.09735999504725139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,4,power_law_1.2,0.08275200128555298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,2,balanced,0.048528000712394714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,4,power_law_1.2,0.15482879877090455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,2,balanced,0.09927999973297119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,4,power_law_1.2,0.08264319896697998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,2,balanced,0.06439466774463654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,4,power_law_1.2,0.19757440090179443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,2,balanced,0.09942400455474854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,2,balanced,0.06865600248177846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,4,power_law_1.2,0.2111680030822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,4,power_law_1.2,0.08739839792251587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,2,balanced,0.10027733445167542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,2,balanced,0.06876266499360402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,4,power_law_1.2,0.09441919922828675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,2,balanced,0.07018133501211803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,2,balanced,0.10000532865524292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,4,power_law_1.2,0.31499519348144533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,2,balanced,0.07030400137106578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,2,balanced,0.10428800185521443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,4,power_law_1.2,0.41383042335510256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,4,power_law_1.2,0.08485119938850402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,2,balanced,0.0706826647122701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,2,balanced,0.10325866937637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,4,power_law_1.2,0.537824010848999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,4,power_law_1.2,0.08891519904136658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,2,balanced,0.07123733560244243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,2,balanced,0.10402666529019673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,4,power_law_1.2,0.09895039796829223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,4,power_law_1.2,0.64584321975708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,2,balanced,0.0729013333717982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,2,balanced,0.108106662829717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,4,power_law_1.2,0.11859840154647827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,4,power_law_1.2,1.0071040153503419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,2,balanced,0.07478400071461995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,2,balanced,0.1076800028483073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,4,power_law_1.2,0.13256959915161132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,4,power_law_1.2,1.543283176422119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,2,balanced,0.07606933514277141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,2,balanced,0.1090773344039917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,4,power_law_1.2,0.1218176007270813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,4,power_law_1.2,0.17709439992904663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,2,balanced,0.07761066655317943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,4,power_law_1.2,2.044806480407715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,2,balanced,0.11783466736475627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,4,power_law_1.2,0.23729279041290283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,2,balanced,0.07978133360544841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,4,power_law_1.2,0.3076479911804199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,2,balanced,0.12110400199890137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,4,power_law_1.2,3.453945541381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,4,power_law_1.2,0.43797760009765624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,2,balanced,0.09419199824333191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,2,balanced,0.12277332941691081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,4,power_law_1.2,0.5689919948577881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,4,power_law_1.2,4.0078784942626955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,2,balanced,0.0938933293024699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,2,balanced,0.1365653375784556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,4,power_law_1.2,0.9284480094909668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,2,balanced,0.1014453371365865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,2,balanced,0.1606613298257192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,4,power_law_1.2,5.362041473388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,4,power_law_1.2,1.2601920127868653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,2,balanced,0.116757333278656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,2,balanced,0.21982399622599283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,4,power_law_1.2,1.5417023658752442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,4,power_law_1.2,2.155251121520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,4,power_law_1.2,12.446073913574219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,2,balanced,0.13194132844607034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,2,balanced,0.3027519981066386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,2,balanced,0.032485333581765495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,4,power_law_1.2,3.277324676513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,2,balanced,0.17667200167973837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,2,balanced,0.2556160092353821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,2,balanced,0.04270400106906891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,4,power_law_1.2,5.036857604980469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,2,balanced,0.1959786613782247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,2,balanced,0.37001065413157147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,2,balanced,0.06026133398214976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,4,power_law_1.2,7.08282241821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,2,balanced,0.06326933205127716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,2,balanced,0.28138667345046997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,2,balanced,0.4683573246002197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,4,power_law_1.2,10.139993286132812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,2,balanced,0.06442133088906606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,2,balanced,0.3556426763534546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,2,balanced,0.0653706689675649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,2,balanced,0.6801226933797201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,4,power_law_1.2,19.827320861816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,2,balanced,0.06628799935181935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,2,balanced,0.5125120083491007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,2,power_law_1.01,0.054995197057724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,2,balanced,0.8894879817962646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,2,balanced,0.06549866497516632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,2,balanced,0.6675626436869303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,2,power_law_1.01,0.07030400037765502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,2,balanced,1.3149706522623699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,2,power_law_1.01,0.06383360028266907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,2,power_law_1.01,0.09559040069580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,2,balanced,0.9824960231781006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,2,balanced,0.06850666801134746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,2,power_law_1.01,0.09763200283050537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,2,balanced,1.7568480173746746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,2,balanced,0.06985599795977275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,2,power_law_1.01,0.10118399858474732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,2,balanced,1.2871733506520588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,2,power_law_1.01,0.10848000049591064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,2,power_law_1.01,0.046937599778175354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,2,power_law_1.01,0.11361279487609863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,2,balanced,2.1997440656026206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,2,power_law_1.01,0.05432320237159729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,2,power_law_1.01,0.11579519510269165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,2,balanced,1.599082628885905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,2,power_law_1.01,0.05368319749832153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,2,power_law_1.01,0.1204800009727478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,2,power_law_1.01,0.06713600158691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,2,power_law_1.01,0.1217087984085083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,2,power_law_1.01,0.04391680061817169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,2,balanced,0.07181866466999054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,2,power_law_1.01,0.06731520295143127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,2,power_law_1.01,0.12448639869689941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,2,balanced,3.4083998998006186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,2,power_law_1.01,0.042745599150657655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,2,power_law_1.01,0.06951680183410644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,2,balanced,0.07439466814200084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,2,power_law_1.01,0.1267135977745056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,2,power_law_1.01,0.04565759897232056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,2,balanced,2.5019787152608237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,2,power_law_1.01,0.1462656021118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,2,balanced,0.07718400160471599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,2,power_law_1.01,0.07500799894332885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,2,power_law_1.01,0.06359040141105651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,2,power_law_1.01,0.17424639463424682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,2,power_law_1.01,0.07634559869766236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,2,balanced,0.07851733267307281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,2,power_law_1.01,0.06497920155525208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,2,power_law_1.01,0.1686079978942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,2,power_law_1.01,0.07774720191955567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,2,power_law_1.01,0.06958720088005066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,2,power_law_1.01,0.17972480058670043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,2,power_law_1.01,0.07756159901618957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,2,power_law_1.01,0.07685760259628296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,2,power_law_1.01,0.22655999660491943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,2,power_law_1.01,0.08064640164375306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,2,balanced,0.09083732962608337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,2,power_law_1.01,0.07975040078163147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,2,power_law_1.01,0.3028991937637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,2,power_law_1.01,0.0902079999446869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,2,balanced,6.724389394124349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,2,balanced,0.09384533762931824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,2,power_law_1.01,0.08831359744071961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,2,power_law_1.01,0.3867136001586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,2,balanced,0.10026666522026062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,2,balanced,4.916831970214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,2,power_law_1.01,0.10531200170516967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,2,power_law_1.01,0.4096191883087158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,2,power_law_1.01,0.08117759823799134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,2,balanced,0.13620799779891968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,2,power_law_1.01,0.11856000423431397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,2,power_law_1.01,0.6425343990325928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,2,power_law_1.01,0.08488960266113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,2,balanced,0.14804266889890036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,2,power_law_1.01,0.11975040435791015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,2,power_law_1.01,0.7734720230102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,2,power_law_1.01,0.13385599851608276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,2,power_law_1.01,1.1487680435180665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,2,power_law_1.01,0.08325120210647582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,2,power_law_1.01,0.1532415986061096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,2,power_law_1.01,1.5727423667907714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,2,power_law_1.01,0.08931840062141419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,2,power_law_1.01,0.1833343982696533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,2,balanced,0.20683199167251587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,2,power_law_1.01,1.871558380126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,2,power_law_1.01,0.09516800045967103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,2,power_law_1.01,0.2508608102798462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,2,balanced,0.27248533566792804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,2,power_law_1.01,2.601152038574219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,2,power_law_1.01,0.10375679731369018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,2,power_law_1.01,0.26751999855041503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,2,power_law_1.01,2.7589120864868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,2,balanced,0.41009068489074707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,2,power_law_1.01,0.11854720115661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,2,power_law_1.01,0.42304000854492185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,2,balanced,0.5343519846598307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,2,power_law_1.01,5.000985717773437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,2,power_law_1.01,0.11892479658126831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,2,power_law_1.01,0.5419712066650391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,2,power_law_1.01,0.7112448215484619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,2,power_law_1.01,0.13125760555267335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,2,balanced,0.8109386761983236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,2,power_law_1.01,10.635878753662109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,2,power_law_1.01,0.17153279781341552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,2,power_law_1.01,0.9642304420471192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,2,balanced,1.0714826583862305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,2,power_law_1.01,0.2181312084197998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,2,power_law_1.01,1.262169647216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,2,power_law_1.01,1.9636415481567382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,2,balanced,1.5996586481730144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,2,power_law_1.01,0.32346880435943604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,2,power_law_1.01,2.378188705444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,2,power_law_1.01,0.4100031852722168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,2,power_law_1.01,3.8555648803710936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,2,power_law_1.01,0.6366464138031006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,2,balanced,2.1141494115193686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,2,power_law_1.01,0.8569536209106445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,2,power_law_1.01,6.577247619628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,2,power_law_1.01,1.0800127983093262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,2,balanced,2.6263893445332847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,2,power_law_1.01,1.6864831924438477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,2,power_law_1.01,2.8483776092529296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,2,power_law_1.01,3.2898880004882813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,2,balanced,4.189557393391927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,2,power_law_1.01,4.377248001098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,2,power_law_1.2,0.06064000129699707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,2,power_law_1.01,6.209510421752929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,2,power_law_1.2,0.060089600086212155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,2,power_law_1.01,12.817280578613282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,2,power_law_1.2,0.0821183979511261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,2,power_law_1.2,0.09763839840888977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,2,power_law_1.2,0.09800320267677307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,2,power_law_1.2,0.10180480480194092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,2,balanced,8.340351740519205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,2,power_law_1.2,0.10776319503784179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,2,power_law_1.2,0.11441919803619385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,2,power_law_1.2,0.04881280064582825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,2,power_law_1.2,0.11416959762573242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,2,power_law_1.2,0.11783039569854736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,2,power_law_1.2,0.04739840030670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,2,power_law_1.2,0.12012799978256225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,2,power_law_1.2,0.04902400076389313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,2,power_law_1.2,0.12528640031814575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,2,power_law_1.2,0.06644480228424073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,2,power_law_1.2,0.13428479433059692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,2,power_law_1.2,0.06658560037612915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,2,power_law_1.2,0.14419840574264525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,2,power_law_1.2,0.07200639843940734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,2,power_law_1.2,0.16266239881515504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,2,power_law_1.2,0.07427200078964233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,2,power_law_1.2,0.17375359535217286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,2,power_law_1.2,0.07470719814300537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,2,power_law_1.2,0.16981760263442994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,2,power_law_1.2,0.07635200023651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,2,power_law_1.2,0.22571520805358886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,2,power_law_1.2,0.07827200293540955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,2,power_law_1.2,0.29409921169281006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,2,power_law_1.2,0.08484479784965515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,2,power_law_1.2,0.08848000168800355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,2,power_law_1.2,0.39070720672607423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,2,power_law_1.2,0.08811519742012024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,2,power_law_1.2,0.3751552104949951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,2,power_law_1.2,0.10589439868927002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,2,power_law_1.2,0.5312448024749756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,2,power_law_1.2,0.11252479553222657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,2,power_law_1.2,0.7813759803771972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,2,power_law_1.2,0.11820160150527954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,2,power_law_1.2,1.1005311965942384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,2,power_law_1.2,0.1252671957015991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,2,power_law_1.2,1.4949952125549317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,2,power_law_1.2,0.1602687954902649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,2,power_law_1.2,1.8436544418334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,2,power_law_1.2,0.1800384044647217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,1,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,2,power_law_1.2,0.24359679222106934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,2,power_law_1.2,2.713376045227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,2,power_law_1.2,0.3170880079269409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,1,balanced,0.06346666812896729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,2,power_law_1.2,3.975513458251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,2,power_law_1.2,0.36389119625091554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,1,balanced,0.09678933024406433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,2,power_law_1.2,0.042105600237846375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,2,power_law_1.2,6.148652648925781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,2,power_law_1.2,0.5166592121124267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,1,balanced,0.0977280040582021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,2,power_law_1.2,0.042777600884437564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,2,power_law_1.2,0.6675392150878906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,1,balanced,0.09901866316795349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,2,power_law_1.2,0.04844799935817719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,2,power_law_1.2,11.510797119140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,2,power_law_1.2,0.06238719820976257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,1,balanced,0.09974400202433269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,2,power_law_1.2,1.0167936325073241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,2,power_law_1.2,0.06264320015907288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,1,balanced,0.10086400310198466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,2,power_law_1.2,0.06803200244903565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,2,power_law_1.2,1.5906047821044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,2,power_law_1.2,0.07564799785614014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,1,balanced,0.10121599833170573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,2,power_law_1.2,1.8278528213500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,2,power_law_1.2,0.0776639997959137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,1,balanced,0.10436800122261047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,2,power_law_1.2,2.523302459716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,1,balanced,0.10442666212717693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,2,power_law_1.2,0.07988479733467102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,2,power_law_1.2,3.9232128143310545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,1,balanced,0.10689066847165425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,2,power_law_1.2,0.08292480111122132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,1,balanced,0.10945066809654236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,2,power_law_1.2,7.7046974182128904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,1,balanced,0.11162666479746501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,1,balanced,0.03734933336575826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,2,power_law_1.2,0.08819199800491333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,1,balanced,0.1188106636206309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,2,power_law_1.2,0.09368320107460022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,1,balanced,0.049135997891426086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,2,power_law_1.2,0.09544960260391236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,1,balanced,0.1276746690273285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,2,power_law_1.2,0.10204800367355346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,1,balanced,0.06482666730880737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,1,balanced,0.1280693312486013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,1,balanced,0.0679253339767456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,2,power_law_1.2,0.11938560009002686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,1,balanced,0.06937600175539653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,2,power_law_1.2,0.12271360158920289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,1,balanced,0.14705066879590353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,2,power_law_1.2,0.14489599466323852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,1,balanced,0.07019199927647908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,1,balanced,0.16658666729927063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,2,power_law_1.2,0.1795904040336609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,1,balanced,0.07063466807206471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,2,power_law_1.2,0.21269121170043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,1,balanced,0.1813973387082418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,1,balanced,0.07145600020885468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,2,power_law_1.2,0.3566528081893921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,1,balanced,0.2479733427365621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,1,balanced,0.07246399919191997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,2,power_law_1.2,0.4043327808380127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,2,power_law_1.2,0.6759103775024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,1,balanced,0.34460266431172687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,1,balanced,0.07373866438865662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,2,power_law_1.2,0.7195648193359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,1,balanced,0.07578666508197784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,1,balanced,0.4676320155461629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,2,power_law_1.2,1.2079872131347655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,1,balanced,0.0793333351612091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,2,power_law_1.2,1.5953280448913574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,1,balanced,0.5347466468811035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,2,power_law_1.2,2.808691215515137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,1,balanced,0.08086400230725606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,2,power_law_1.2,3.500089645385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,1,balanced,0.08742933471997578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,1,balanced,0.7837546666463217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,1,balanced,0.09521599610646565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,1,balanced,0.03387733300526937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,2,power_law_1.2,4.305427169799804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,1,balanced,0.0962666670481364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,1,balanced,0.04438933233420054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,1,balanced,1.0223626295725505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,2,power_law_1.2,7.270086669921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,1,balanced,0.11357333262761433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,1,balanced,0.06154666841030121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,2,power_law_1.2,13.313273620605468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,1,balanced,0.13270399967829385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,1,balanced,0.06424533327420552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,1,balanced,1.5131999651590984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,1,balanced,0.14251200358072916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,1,balanced,0.06609599788983662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,1,balanced,0.06709333260854085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,1,balanced,0.19503466288248697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,1,power_law_1.01,0.04966399967670441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,1,balanced,1.9984159469604492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,1,balanced,0.06845866640408833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,1,balanced,0.24237332741419473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,1,power_law_1.01,0.05433599948883057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,1,power_law_1.01,0.03944959938526153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,1,balanced,0.06931733091672261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,1,balanced,0.34679468472798664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,1,power_law_1.01,0.06344320178031922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,1,power_law_1.01,0.043219199776649474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,1,balanced,2.49507729212443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,1,power_law_1.01,0.09681919813156128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,1,balanced,0.4349173307418823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,1,power_law_1.01,0.046419200301170346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,1,power_law_1.01,0.0961023986339569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,1,balanced,0.6391839981079102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,1,power_law_1.01,0.10068479776382447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,1,power_law_1.01,0.0659712016582489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,1,balanced,0.0730560024579366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,1,power_law_1.01,0.10682879686355591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,1,power_law_1.01,0.06843519806861878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,1,balanced,0.8188479741414388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,1,power_law_1.01,0.109990394115448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,1,power_law_1.01,0.0741312026977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,1,balanced,0.0740479975938797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,1,balanced,3.9305760065714517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,1,power_law_1.01,0.526636791229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,1,power_law_1.01,0.0756991982460022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,1,balanced,1.1910719871520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,1,power_law_1.01,0.5271743774414063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,1,power_law_1.01,0.07736960053443909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,1,power_law_1.01,0.12319999933242798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,1,power_law_1.01,0.07941759824752807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,1,power_law_1.01,0.1248703956604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,1,balanced,1.591909408569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,1,power_law_1.01,0.08016639947891235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,1,power_law_1.01,0.1265727996826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,1,power_law_1.01,0.08240640163421631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,1,power_law_1.01,0.15262080430984498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,1,balanced,0.07940799991289775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,1,power_law_1.01,0.0864512026309967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,1,power_law_1.01,0.15589120388031005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,1,balanced,1.9855626424153645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,1,balanced,7.682773590087891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,1,balanced,0.08366933465003967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,1,power_law_1.01,0.08774399757385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,1,power_law_1.01,0.15742080211639403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,1,balanced,0.08646399776140849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,1,power_law_1.01,0.10408960580825806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,1,power_law_1.01,0.20841600894927978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,1,balanced,0.09096533060073853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,1,power_law_1.01,0.11153279542922974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,1,power_law_1.01,0.2256319999694824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,1,balanced,0.10660266876220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,1,balanced,3.072277386983236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,1,power_law_1.01,0.11304320096969604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,1,power_law_1.01,0.22970879077911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,1,balanced,0.1114453375339508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,1,power_law_1.01,0.11784960031509399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,1,power_law_1.01,0.2943552017211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,1,balanced,0.1218346655368805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,1,power_law_1.01,0.1538815975189209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,1,power_law_1.01,0.35300478935241697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,1,balanced,0.17377599080403647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,1,power_law_1.01,0.5091392040252686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,1,power_law_1.01,0.16931840181350707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,1,balanced,0.20087466637293497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,1,power_law_1.01,0.5940224170684815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,1,power_law_1.01,0.21955199241638185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,1,power_law_1.01,0.2683840036392212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,1,power_law_1.01,0.8126015663146973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,1,balanced,0.30050132671991986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,1,power_law_1.01,0.3700031995773315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,1,power_law_1.01,1.0586048126220704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,1,balanced,6.0436585744222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,1,balanced,0.3933653434117635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,1,power_law_1.01,0.4641791820526123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,1,power_law_1.01,1.5026880264282227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,1,balanced,0.5749066670735677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,1,power_law_1.01,0.6580287933349609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,1,power_law_1.01,2.0281471252441405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,1,balanced,0.7495466868082682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,1,power_law_1.01,0.8145919799804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,1,power_law_1.01,2.5544063568115236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,1,power_law_1.01,1.2151359558105468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,1,balanced,1.126757303873698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,1,power_law_1.01,3.8613441467285154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,1,power_law_1.01,1.601759910583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,1,balanced,1.4788373311360676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,1,power_law_1.01,7.640646362304688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,1,power_law_1.01,2.0042751312255858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,1,power_law_1.01,0.03553279936313629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,1,power_law_1.01,3.083769607543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,1,power_law_1.01,0.039366400241851805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,1,balanced,2.2208639780680337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,1,power_law_1.01,0.04636160135269165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,1,power_law_1.01,6.055238342285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,1,power_law_1.01,0.06161919832229614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,1,power_law_1.01,0.06314880251884461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,1,balanced,2.9467039108276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,1,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,1,power_law_1.01,0.07230079770088196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,1,power_law_1.2,0.054636800289154054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,1,power_law_1.01,0.0739135980606079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,1,power_law_1.2,0.06505600214004517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,1,power_law_1.01,0.07616000175476074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,1,balanced,3.6592321395874023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,1,power_law_1.2,0.09575039744377137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,1,power_law_1.2,0.09833599925041199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,1,power_law_1.01,0.08275840282440186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,1,power_law_1.2,0.10053119659423829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,1,power_law_1.01,0.08361600041389465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,1,balanced,5.859743754069011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,1,power_law_1.2,0.10250240564346313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,1,power_law_1.2,0.10933120250701904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,1,power_law_1.01,0.089055997133255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,1,power_law_1.2,0.31889920234680175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,1,power_law_1.01,0.09283199906349182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,1,power_law_1.2,0.9387904167175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,1,power_law_1.2,0.03826560080051422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,1,power_law_1.01,0.09651200175285339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,1,power_law_1.2,0.11960320472717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,1,power_law_1.2,0.042099198698997496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,1,power_law_1.01,0.10241279602050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,1,power_law_1.2,0.12392959594726563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,1,power_law_1.2,0.047091200947761536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,1,power_law_1.2,0.0654911994934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,1,power_law_1.01,0.12358399629592895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,1,power_law_1.2,0.12604160308837892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,1,power_law_1.2,0.06652799844741822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,1,balanced,11.685258229573568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,1,power_law_1.01,0.12702080011367797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,1,power_law_1.2,0.0747327983379364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,1,power_law_1.2,0.1491520047187805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,1,power_law_1.2,0.07442560195922851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,1,power_law_1.01,0.1459712028503418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,1,power_law_1.2,0.07633280158042907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,1,power_law_1.2,0.15170559883117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,1,power_law_1.2,0.07889919877052307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,1,power_law_1.01,0.19088000059127808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,1,power_law_1.2,0.16058239936828614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,1,power_law_1.2,0.08032000064849854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,1,power_law_1.2,0.08197759985923767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.01,0.22644479274749757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,1,power_law_1.2,0.08551679849624634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,1,power_law_1.2,0.2125312089920044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.01,0.3301568031311035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,1,power_law_1.2,0.08770560026168824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,1,power_law_1.2,0.2270656108856201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,1,power_law_1.2,0.10312960147857667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.01,0.4176447868347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,1,power_law_1.2,0.11027840375900269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,1,power_law_1.2,0.2263808012008667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,1,power_law_1.2,0.11214720010757447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.01,0.6016255855560303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,1,power_law_1.2,0.11784960031509399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,1,power_law_1.2,0.29663360118865967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,1,power_law_1.2,0.1539520025253296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.01,0.7821568012237549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,1,power_law_1.2,0.374399995803833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,1,power_law_1.2,0.16622079610824586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.01,1.1536831855773926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,1,power_law_1.2,0.22035839557647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,1,power_law_1.2,0.4750976085662842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,1,power_law_1.2,0.27044479846954345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.01,1.5244352340698242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,1,power_law_1.2,0.596895980834961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,1,power_law_1.2,0.3683455944061279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.01,2.2350719451904295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,1,power_law_1.2,0.8290880203247071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,1,power_law_1.2,0.4607679843902588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.01,2.9636735916137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,1,power_law_1.2,1.046463966369629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,1,power_law_1.2,0.6566656112670899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,1,power_law_1.2,0.828006362915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,1,power_law_1.01,3.6974464416503907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,1,power_law_1.2,1.4959424018859864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,1,power_law_1.2,1.2054080009460448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,1,power_law_1.2,2.0430976867675783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,1,power_law_1.2,1.6079231262207032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,1,power_law_1.01,5.877727890014649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,1,power_law_1.2,2.021830368041992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,1,power_law_1.2,2.559712028503418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,1,power_law_1.2,3.0706623077392576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,1,power_law_1.01,11.742578887939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,1,power_law_1.2,3.8723968505859374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,1,power_law_1.2,6.040505599975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,1,power_law_1.2,7.607878112792969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,1,power_law_1.2,0.03459199965000152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,1,power_law_1.2,0.03896960020065308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,1,power_law_1.2,0.043244799971580504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,1,power_law_1.2,0.06330879926681518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,1,power_law_1.2,0.06325119733810425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,1,power_law_1.2,0.07153279781341552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,1,power_law_1.2,0.07516160011291503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,1,power_law_1.2,0.07731199860572815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,1,power_law_1.2,0.08149120211601257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,1,power_law_1.2,0.08420479893684388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,1,power_law_1.2,0.09160320162773132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,1,power_law_1.2,0.09404799938201905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,1,power_law_1.2,0.09903360009193421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,1,power_law_1.2,0.10461440086364746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,1,power_law_1.2,0.12344959974288941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,1,power_law_1.2,0.13056639432907105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,1,power_law_1.2,0.14350080490112305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,1,power_law_1.2,0.19095040559768678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.2,0.22675199508666993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.2,0.33124480247497556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.2,0.4225791931152344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.2,0.5971839904785157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.2,0.7805759906768799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,16,balanced,0.0819413314263026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.2,1.1490880012512208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,16,balanced,0.07939200103282928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.2,1.497433567047119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,16,balanced,0.0813973347345988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.2,2.2299968719482424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,16,balanced,0.12486933668454488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.2,2.968179130554199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,16,balanced,0.21075733502705893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,16,balanced,0.3700480063756307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,1,power_law_1.2,3.679500961303711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,16,balanced,0.3689440091451009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,1,power_law_1.2,5.881631851196289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,16,balanced,0.36850666999816895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,16,balanced,0.36934399604797363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,1,power_law_1.2,11.70483856201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,16,balanced,0.3696586688359578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,16,balanced,0.05719466507434845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,16,balanced,0.3688053290049235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,16,balanced,0.06111466884613037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,16,balanced,0.3699093262354533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,16,balanced,0.06277866661548615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,16,balanced,0.36979198455810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,16,balanced,0.08747200171152751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,16,balanced,0.37274666627248126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,16,balanced,0.1291146675745646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,16,balanced,0.3781760136286418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,16,balanced,0.21024533112843832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,16,balanced,0.379530668258667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,16,balanced,0.2124639948209127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,16,balanced,0.05074666440486908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,16,balanced,0.38556798299153644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,16,balanced,0.2111519972483317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,16,balanced,0.05086400111516317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,16,balanced,0.21363200743993124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,16,balanced,0.4068959951400757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,16,balanced,0.061162665486335754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,16,balanced,0.21303466955820718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,16,balanced,0.4176959991455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,16,balanced,0.09110933542251587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,16,balanced,0.21715199947357178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,16,balanced,0.1348960002263387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,16,balanced,0.21789334217707315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,16,balanced,0.43297068277994794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,16,balanced,0.2092693249384562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,16,balanced,0.22062400976816812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,16,balanced,0.21114667256673178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,16,balanced,0.22377600272496542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,16,balanced,0.46642665068308514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,16,balanced,0.21206400791803995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,16,balanced,0.2294399936993917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,16,balanced,0.2130826711654663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,16,balanced,0.23259733120600382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,16,balanced,0.21281067530314127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,16,balanced,0.4970613320668538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,16,balanced,0.21459199984868368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,16,balanced,0.2386773427327474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,16,balanced,0.21878933906555176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,16,power_law_1.01,0.22098560333251954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,16,balanced,0.2518453399340312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,16,balanced,0.21874666213989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,16,balanced,0.5338826576868693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,16,balanced,0.22123199701309204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,16,power_law_1.01,0.3734015941619873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,16,balanced,0.26498132944107056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,16,power_law_1.01,0.12293119430541992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,16,balanced,0.22839999198913574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,16,power_law_1.01,0.15485440492630004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,16,balanced,0.2892373402913411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,16,balanced,0.23061867554982504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,16,balanced,0.6860480308532715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,16,power_law_1.01,0.1969215989112854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,16,balanced,0.2376319964726766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,16,power_law_1.01,0.23168001174926758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,16,balanced,0.32131733496983844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,16,power_law_1.01,0.3067647933959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,16,power_law_1.01,0.2967423915863037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,16,balanced,0.36003732681274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,16,power_law_1.01,0.31559679508209226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,16,power_law_1.01,0.31208319664001466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,16,balanced,0.74290664990743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,16,power_law_1.01,0.3402623891830444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,16,balanced,0.255018671353658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,16,power_law_1.01,0.34358398914337157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,16,balanced,0.4129973252614339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,16,power_law_1.01,0.3493567943572998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,16,power_law_1.01,0.3738176107406616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,16,power_law_1.01,0.39978880882263185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,16,power_law_1.01,0.388153600692749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,16,balanced,0.5432053407033285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,16,balanced,1.0268747011820476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,16,power_law_1.01,0.44413437843322756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,16,power_law_1.01,0.4680448055267334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,16,power_law_1.01,0.5083712100982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,16,balanced,0.2754240036010742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,16,power_law_1.01,0.6040512084960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,16,balanced,0.6296319961547852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,16,power_law_1.01,0.5940415859222412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,16,balanced,0.3035786747932434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,16,power_law_1.01,0.6865791797637939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,16,power_law_1.01,0.8240832328796387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,16,balanced,0.32553066809972125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,16,power_law_1.01,1.017356777191162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,16,power_law_1.01,0.13293440341949464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,16,power_law_1.01,1.3255552291870116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,16,balanced,1.3077279726664226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,16,power_law_1.01,0.2156991958618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,16,power_law_1.2,0.21942400932312012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,16,balanced,0.4017546574274699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,16,power_law_1.01,1.8963071823120117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,16,power_law_1.01,0.11598080396652222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,16,balanced,0.8901013533274332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,16,power_law_1.2,0.3665791988372803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,16,power_law_1.01,2.389740753173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,16,power_law_1.01,0.09556480050086975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,16,power_law_1.01,0.13303680419921876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,16,power_law_1.2,0.08549759984016418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,16,power_law_1.01,2.811142349243164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,16,balanced,0.45818666617075604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,16,power_law_1.01,0.1379520058631897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,16,power_law_1.2,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,16,power_law_1.01,0.2142335891723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,16,power_law_1.01,4.409868621826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,16,power_law_1.01,0.15199359655380248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,16,power_law_1.2,0.18133759498596191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,16,power_law_1.01,0.11210240125656128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,16,power_law_1.01,0.18981120586395264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,16,power_law_1.01,9.475225830078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,16,power_law_1.2,0.23724799156188964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,16,power_law_1.01,0.11056640148162841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,16,balanced,0.6840960184733073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,16,power_law_1.01,0.16864000558853148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,16,power_law_1.2,0.3035583972930908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,16,power_law_1.01,0.12136319875717164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,16,power_law_1.01,0.18801920413970946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,16,balanced,1.608751932779948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,16,balanced,1.140448013941447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,16,power_law_1.2,0.32152960300445554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,16,power_law_1.01,0.149619197845459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,16,power_law_1.01,0.18466559648513795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,16,power_law_1.2,0.3125119924545288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,16,power_law_1.01,0.18173439502716066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,16,balanced,0.7938933372497559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,16,power_law_1.01,0.18663040399551392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,16,power_law_1.2,0.3088831901550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,16,power_law_1.01,0.19262080192565917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,16,power_law_1.01,0.19880319833755494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,16,power_law_1.2,0.3279936075210571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,16,power_law_1.01,0.19642879962921142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,16,power_law_1.01,0.21300480365753174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,16,power_law_1.2,0.3430016040802002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,16,power_law_1.01,0.1951167941093445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,16,power_law_1.01,0.2235584020614624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,16,power_law_1.2,0.3412544012069702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,16,power_law_1.01,0.2085952043533325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,16,power_law_1.01,0.2224384069442749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,16,power_law_1.2,0.3759360074996948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,16,balanced,1.1720960140228271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,16,power_law_1.01,0.2409343957901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,16,power_law_1.01,0.21285760402679443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,16,power_law_1.2,0.4092671871185303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,16,balanced,1.4000053405761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,16,power_law_1.01,0.2543231964111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,16,power_law_1.01,0.22622079849243165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,16,power_law_1.2,0.47129597663879397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,16,power_law_1.01,0.27799038887023925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,16,power_law_1.01,0.24508800506591796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,16,power_law_1.2,0.4326848030090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,16,power_law_1.01,0.30078721046447754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,16,power_law_1.01,0.25858559608459475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,16,power_law_1.2,0.529804801940918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,16,power_law_1.01,0.3835200071334839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,16,power_law_1.2,0.5578303813934327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,16,power_law_1.01,0.27781119346618655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,16,balanced,2.507749398549398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,16,power_law_1.01,0.39908480644226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,16,power_law_1.2,0.7205311775207519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,16,power_law_1.01,0.30398080348968504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,16,power_law_1.01,0.4920512199401855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,16,balanced,1.5488959948221843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,16,power_law_1.2,0.6596288204193115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,16,power_law_1.01,0.5904831886291504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,16,power_law_1.2,0.8404671669006347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,16,power_law_1.01,0.3546367883682251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,16,power_law_1.01,0.7634687900543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,16,power_law_1.2,0.9288512229919433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,16,power_law_1.01,0.8967743873596191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,16,power_law_1.2,1.2866559982299806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.01,0.32591359615325927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,16,power_law_1.01,1.3280896186828612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,16,power_law_1.2,1.7331520080566407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,16,power_law_1.01,0.43063039779663087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,16,power_law_1.01,1.72108154296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,16,power_law_1.2,2.184339141845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,16,balanced,2.191194693247477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.01,0.5035200119018555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,16,power_law_1.01,2.2360639572143555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,16,power_law_1.2,2.824851226806641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,16,power_law_1.01,0.662988805770874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,16,balanced,1.931173324584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,16,power_law_1.2,4.021567916870117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,16,power_law_1.01,3.124799919128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.01,0.839897632598877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,16,power_law_1.01,1.1372415542602539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,16,power_law_1.2,6.174316787719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,16,power_law_1.01,7.148242950439453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.01,1.5429759979248048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,16,power_law_1.01,1.9969663619995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,16,power_law_1.2,12.772102355957031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,16,power_law_1.2,0.13326719999313355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.01,2.897126388549805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,16,power_law_1.2,0.1978495955467224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,16,power_law_1.01,3.557542419433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,16,power_law_1.2,0.082150399684906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,16,power_law_1.01,5.3900096893310545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,16,power_law_1.2,0.09478399753570557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,16,power_law_1.2,0.12153600454330445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,16,power_law_1.01,10.880441284179687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,16,power_law_1.2,0.1320512056350708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,16,balanced,3.0429865519205728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,16,power_law_1.2,0.17870080471038818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,16,balanced,4.959578514099121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,16,power_law_1.2,0.1704256057739258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,16,power_law_1.2,0.17679359912872314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,16,power_law_1.2,0.1912511944770813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,16,power_law_1.2,0.19767680168151855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,16,power_law_1.2,0.21109120845794677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,16,power_law_1.2,0.21106560230255128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,16,power_law_1.2,0.22970240116119384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,16,balanced,4.306469281514485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,16,power_law_1.2,0.24499199390411378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,16,power_law_1.2,0.25109119415283204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,16,power_law_1.2,0.25639679431915285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,16,power_law_1.2,0.2969599962234497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,16,power_law_1.2,0.31578240394592283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,16,power_law_1.2,0.39312000274658204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,16,power_law_1.2,0.43157758712768557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,16,power_law_1.2,0.5154751777648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,16,power_law_1.2,0.6424320220947266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,16,power_law_1.2,0.8881279945373535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,16,power_law_1.2,1.1819775581359864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,16,balanced,6.07913080851237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,16,power_law_1.2,1.5955455780029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,16,power_law_1.2,2.043519973754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,16,power_law_1.2,2.5356800079345705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,16,power_law_1.2,4.37896957397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,16,power_law_1.2,8.935469055175782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,16,power_law_1.2,0.1335935950279236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,16,power_law_1.2,0.20288000106811524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,16,power_law_1.2,0.08339200019836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,16,power_law_1.2,0.0976639986038208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,16,power_law_1.2,0.12235519886016846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,16,power_law_1.2,0.13160320520401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,16,power_law_1.2,0.17490559816360474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,16,power_law_1.2,0.18736000061035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,16,power_law_1.2,0.18408960103988647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,16,power_law_1.2,0.20039041042327882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,16,power_law_1.2,0.20864639282226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,16,power_law_1.2,0.22807679176330567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,16,power_law_1.2,0.24583039283752442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,16,power_law_1.2,0.2500351905822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,16,power_law_1.2,0.27847039699554443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,16,power_law_1.2,0.298854398727417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,16,power_law_1.2,0.3303040027618408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,16,power_law_1.2,0.3632704019546509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.2,0.3648319959640503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,16,power_law_1.2,0.47482881546020506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.2,0.5635583877563477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,16,power_law_1.2,0.7946559906005859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.2,0.9388480186462402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,16,power_law_1.2,1.1640255928039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.2,1.8263359069824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,16,power_law_1.2,2.3127168655395507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,8,balanced,0.060533334811528526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.2,3.718592071533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,8,balanced,0.06518400212128957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,8,balanced,0.049866666396458946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,8,balanced,0.08164266745249431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,16,power_law_1.2,4.638252639770508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,8,balanced,0.1251146694024404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,8,balanced,0.052389333645502724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,8,balanced,0.20378132661183676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,16,power_law_1.2,7.309913635253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,8,balanced,0.06320533156394958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,8,balanced,0.36790398756663006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,8,balanced,0.08868799606959026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,8,balanced,0.3670133352279663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,8,balanced,0.1302880048751831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,16,power_law_1.2,16.11474609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,8,balanced,0.21047999461491904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,8,balanced,0.37083733081817627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,8,balanced,0.21260799964269003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,8,balanced,0.3685866594314575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,8,balanced,0.21268266439437866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,8,balanced,0.36859198411305744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,8,balanced,0.21309866507848105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,8,balanced,0.37028801441192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,8,balanced,0.21448532740275064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,8,balanced,0.21811733643213907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,8,balanced,0.3741866747538249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,8,balanced,0.2193280061086019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,8,balanced,0.3734453519185384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,8,balanced,0.22150399287541708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,8,balanced,0.37675201892852783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,8,balanced,0.22466667493184408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,8,balanced,0.382917324701945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,8,power_law_1.01,0.11961599588394164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,8,balanced,0.2330346703529358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,8,balanced,0.3858559926350911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,8,balanced,0.04859733581542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,8,balanced,0.23660266399383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,8,balanced,0.3932373523712158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,8,power_law_1.01,0.19978879690170287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,8,balanced,0.053354665637016296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,8,balanced,0.0659093310435613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,8,balanced,0.24394667148590088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,8,power_law_1.01,0.10581760406494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,8,balanced,0.41733864943186444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,8,balanced,0.09347732861836751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,8,power_law_1.01,0.12126719951629639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,8,balanced,0.2585759957631429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,8,balanced,0.42955199877421063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,8,balanced,0.13753066460291544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,8,power_law_1.01,0.15957119464874267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,8,balanced,0.2124906579653422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,8,balanced,0.2747199932734172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,8,power_law_1.01,0.08692479729652405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,8,balanced,0.4487626552581787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,8,power_law_1.01,0.21942400932312012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,8,balanced,0.21444799502690634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,8,power_law_1.01,0.12335360050201416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,8,power_law_1.01,0.27128961086273196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,8,balanced,0.3219253420829773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,8,balanced,0.21439466873804727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,8,balanced,0.4843466679255168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,8,power_law_1.01,0.2912512063980103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,8,balanced,0.21688532829284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,8,power_law_1.01,0.0674560010433197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,8,balanced,0.33985066413879395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,8,balanced,0.21714133024215698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,8,power_law_1.01,0.3038655996322632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,8,power_law_1.01,0.08170880079269409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,8,balanced,0.5263520081837972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,8,balanced,0.22033600012461343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,8,power_law_1.01,0.3002624034881592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,8,power_law_1.01,0.11775360107421876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,8,balanced,0.22276800870895386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,8,balanced,0.3977280060450236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,8,power_law_1.01,0.32106881141662597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,8,power_law_1.01,0.1435263991355896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,8,balanced,0.5679839849472046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,8,balanced,0.2265066703160604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,8,power_law_1.01,0.3371392011642456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,8,power_law_1.01,0.16513919830322266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,8,balanced,0.22961600621541342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,8,power_law_1.01,0.34547200202941897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,8,balanced,0.45317331949869794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,8,power_law_1.01,0.17530879974365235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,8,balanced,0.2392746607462565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,8,power_law_1.01,0.3546047925949097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,8,balanced,0.7423199812571207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,8,power_law_1.01,0.18316800594329835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,8,balanced,0.24289067586263022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,8,power_law_1.01,0.38858880996704104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,8,balanced,0.2536960045496623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,8,power_law_1.01,0.18919680118560792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,8,balanced,0.6051679849624634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,8,power_law_1.01,0.399833607673645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,8,power_law_1.01,0.186188805103302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,8,power_law_1.01,0.4047552108764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,8,power_law_1.01,0.2076416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,8,balanced,0.8253280321756998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,8,power_law_1.01,0.470963191986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,8,power_law_1.01,0.19992320537567138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,8,power_law_1.01,0.46640639305114745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,8,balanced,0.2800106604894002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,8,power_law_1.01,0.21614720821380615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,8,balanced,0.7165173689524332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,8,power_law_1.01,0.5708479881286621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,8,power_law_1.01,0.23327360153198243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,8,power_law_1.01,0.5473087787628174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,8,power_law_1.01,0.2603775978088379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,8,power_law_1.01,0.0970687985420227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,8,power_law_1.01,0.665555191040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,8,power_law_1.01,0.23717119693756103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,8,balanced,1.146399974822998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,8,power_law_1.01,0.13515520095825195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,8,power_law_1.01,0.8067328453063964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,8,power_law_1.01,0.27878398895263673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,8,power_law_1.01,0.09800959825515747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,8,power_law_1.01,1.0587264060974122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,8,balanced,1.0206560293833415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,8,power_law_1.01,0.3062016010284424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,8,balanced,0.30267200867335003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,8,power_law_1.01,0.08970239758491516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,8,power_law_1.01,1.2347135543823242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,8,power_law_1.01,0.3634752035140991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,8,power_law_1.2,0.13150080442428588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,8,power_law_1.01,0.12356480360031127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,8,power_law_1.01,1.9098688125610352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,8,balanced,0.349455992380778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,8,power_law_1.01,0.3792383909225464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,8,power_law_1.2,0.19601919651031494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,8,power_law_1.01,0.13096319437026976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,8,power_law_1.2,0.09679359793663025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,8,power_law_1.01,2.3045631408691407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,8,power_law_1.01,0.48192639350891114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,8,balanced,0.3877013524373372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,8,power_law_1.01,0.17317119836807252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,8,power_law_1.2,0.12464640140533448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,8,power_law_1.01,0.5814527988433837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,8,power_law_1.01,3.024332809448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,8,balanced,1.4794027010599773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,8,power_law_1.2,0.16462080478668212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,8,power_law_1.01,0.19368959665298463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,8,power_law_1.2,0.20547199249267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,8,balanced,0.5122666756312052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,8,power_law_1.01,0.7755136013031005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,8,power_law_1.2,0.2877568006515503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,8,power_law_1.01,0.19182080030441284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,8,power_law_1.01,4.318745422363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,8,balanced,1.3070933024088542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,8,power_law_1.2,0.30517120361328126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,8,power_law_1.01,0.962451171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,8,power_law_1.01,0.1911743998527527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,8,power_law_1.2,0.31831040382385256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,8,balanced,0.5904959837595621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,8,power_law_1.01,8.908102416992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,8,power_law_1.01,1.442790412902832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,8,power_law_1.01,0.2131648063659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,8,power_law_1.2,0.2999232053756714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,8,power_law_1.2,0.32309761047363283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,8,power_law_1.01,0.22317440509796144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,8,power_law_1.01,1.6977472305297852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,8,power_law_1.2,0.3359872102737427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,8,power_law_1.01,0.2225343942642212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,8,power_law_1.2,0.34678399562835693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,8,power_law_1.01,2.0984832763671877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,8,balanced,0.8926880359649658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,8,power_law_1.2,0.37521920204162595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,8,power_law_1.01,0.24007680416107177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,8,power_law_1.2,0.3844095945358276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,8,power_law_1.01,3.4219009399414064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,8,balanced,1.814517339070638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,8,power_law_1.01,0.2617088079452515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,8,power_law_1.2,0.4341760158538818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,8,power_law_1.2,0.4460927963256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,8,power_law_1.01,0.2861311912536621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,8,power_law_1.2,0.4843711853027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,8,power_law_1.01,6.760959625244141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,8,balanced,1.0553867022196453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,8,balanced,1.6400532722473145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,8,power_law_1.2,0.5283391952514649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,8,power_law_1.01,0.32629120349884033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,8,power_law_1.2,0.6007936000823975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,8,power_law_1.2,0.6189055919647217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,8,power_law_1.2,0.7027008056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,8,power_law_1.01,0.35036799907684324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,8,power_law_1.2,0.9301440238952636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,8,power_law_1.2,1.084780788421631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,8,power_law_1.2,1.3607359886169434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,8,balanced,1.5592320760091145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,8,power_law_1.01,0.3393728017807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,8,power_law_1.2,2.0363840103149413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,8,power_law_1.01,0.45813760757446287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,8,power_law_1.2,2.613542366027832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,8,power_law_1.01,0.5469567775726318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,8,power_law_1.2,3.389759826660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,8,power_law_1.01,0.6894144058227539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,8,power_law_1.2,5.587340927124023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,8,balanced,2.843008041381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,8,power_law_1.01,0.871065616607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,8,power_law_1.01,1.1543423652648925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,8,power_law_1.2,10.169465637207031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,8,balanced,2.064138730367025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,8,balanced,2.527498722076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,8,power_law_1.01,1.5473407745361327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,8,power_law_1.01,2.271219253540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,8,power_law_1.01,2.924799919128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,8,power_law_1.01,3.887071990966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,8,power_law_1.01,5.905516815185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,8,power_law_1.2,0.08685439825057983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,8,balanced,2.561845302581787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,8,power_law_1.01,10.970342254638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,8,power_law_1.2,0.12341120243072509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,8,power_law_1.2,0.06058239936828613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,8,power_law_1.2,0.0933247983455658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,8,power_law_1.2,0.11095679998397827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,8,power_law_1.2,0.1196671962738037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,8,power_law_1.2,0.17342079877853395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,8,power_law_1.2,0.18177920579910278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,8,power_law_1.2,0.17931519746780394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,8,power_law_1.2,0.17885440587997437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,8,power_law_1.2,0.19252480268478395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,8,balanced,4.034624099731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,8,power_law_1.2,0.20274560451507567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,8,balanced,5.6510880788167315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,8,power_law_1.2,0.21457281112670898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,8,power_law_1.2,0.22561280727386473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,8,power_law_1.2,0.24510080814361573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,8,balanced,4.973557472229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,8,power_law_1.2,0.2605952024459839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,8,power_law_1.2,0.2736704111099243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,8,power_law_1.2,0.2931839942932129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,8,power_law_1.2,0.32467200756073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,8,power_law_1.2,0.3934528112411499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,8,power_law_1.2,0.41052799224853515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,8,power_law_1.2,0.5172863960266113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,8,power_law_1.2,0.6619840145111084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,8,power_law_1.2,0.8310720443725585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,8,power_law_1.2,1.058233642578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,8,power_law_1.2,1.5020095825195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,8,power_law_1.2,1.994905662536621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,8,power_law_1.2,2.681331253051758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,8,power_law_1.2,4.124576187133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,8,power_law_1.2,9.514086151123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,8,balanced,8.086106618245443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,8,power_law_1.2,0.09654399752616882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,8,power_law_1.2,0.130457603931427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,8,power_law_1.2,0.06891520023345947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,8,power_law_1.2,0.0933568000793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,4,balanced,0.05866133173306783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,8,power_law_1.2,0.11552640199661254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,4,balanced,0.06594133377075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,8,power_law_1.2,0.14545279741287231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,4,balanced,0.08247466882069905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,8,power_law_1.2,0.177183997631073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,4,balanced,0.127509335676829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,8,power_law_1.2,0.17153919935226442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,4,balanced,0.20427733659744263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,4,balanced,0.3707520167032878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,8,power_law_1.2,0.18279039859771729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,4,balanced,0.37218666076660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,8,power_law_1.2,0.19124480485916137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,4,balanced,0.3757226864496867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,4,balanced,0.3748319943745931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,8,power_law_1.2,0.20454399585723876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,4,balanced,0.37857067584991455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,8,power_law_1.2,0.22853119373321534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,4,balanced,0.3751946687698364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,8,power_law_1.2,0.22573440074920653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,4,balanced,0.3808159828186035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,4,balanced,0.38095466295878094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,8,power_law_1.2,0.2610752105712891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,4,balanced,0.3858293294906616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,8,power_law_1.2,0.2719167947769165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,4,balanced,0.394048015276591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,8,power_law_1.2,0.2838912010192871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,4,balanced,0.3959146738052368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,4,balanced,0.4036853313446045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,8,power_law_1.2,0.3200576066970825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,4,balanced,0.42978131771087646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,4,balanced,0.4591840108235677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,4,balanced,0.049466664592425026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,8,power_law_1.2,0.38576641082763674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,4,balanced,0.05376533170541128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,4,balanced,0.4856160084406535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,4,balanced,0.06498666604359944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,4,balanced,0.5240213473637899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,4,balanced,0.0913759966691335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,4,balanced,0.13831466436386108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,8,power_law_1.2,0.38142080307006837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,4,balanced,0.2161066730817159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,4,balanced,0.5884799957275391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,8,power_law_1.2,0.4634751796722412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,4,balanced,0.21760533253351846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,8,power_law_1.2,0.617299222946167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,4,balanced,0.2192373275756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,4,balanced,0.6621493498484293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,4,balanced,0.2220159967740377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,8,power_law_1.2,0.7768320083618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,4,balanced,0.22367999951044717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,8,power_law_1.2,0.9809599876403808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,4,balanced,0.22641066710154215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,8,power_law_1.2,1.358297634124756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,4,balanced,0.2291733423868815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,4,balanced,0.8649493058522543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,4,balanced,0.23360000054041544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,8,power_law_1.2,1.8464704513549806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,4,balanced,0.2378879984219869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,8,power_law_1.2,2.754969596862793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,4,balanced,0.24702932437260947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,4,balanced,0.25076266129811603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,8,power_law_1.2,3.8558719635009764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,4,balanced,0.9954240322113037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,4,balanced,0.26187199354171753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,8,power_law_1.2,4.685292816162109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,4,balanced,0.27957334121068317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,8,power_law_1.2,7.662022399902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,4,balanced,0.31303999821345013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,4,balanced,0.35636266072591144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,4,balanced,1.3903199831644695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,8,power_law_1.2,13.843263244628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,4,balanced,0.3908960024515788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,4,balanced,0.05903466542561849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,4,power_law_1.01,0.08570240139961242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,4,balanced,0.4667359987894694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,4,balanced,0.06560533245404561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,4,power_law_1.01,0.12004480361938477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,4,balanced,0.0759626676638921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,4,balanced,0.5378079811731974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,4,power_law_1.01,0.07467520236968994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,4,balanced,0.102101335922877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,4,balanced,1.8086454073588054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,4,power_law_1.01,0.10874240398406983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,4,balanced,0.14986133575439453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,4,power_law_1.01,0.1715456008911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,4,balanced,0.23131734132766724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,4,balanced,0.7430453300476074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,4,power_law_1.01,0.21843841075897216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,4,balanced,0.23502933979034424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,4,power_law_1.01,0.06261759996414185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,4,balanced,0.23514666159947714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,4,power_law_1.01,0.28134400844573976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,4,balanced,0.23853333791097006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,4,power_law_1.01,0.2994879961013794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,4,power_law_1.01,0.08356480002403259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,4,balanced,0.23989866177241007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,4,balanced,0.892959992090861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,4,power_law_1.01,0.29605119228363036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,4,power_law_1.01,0.0723136007785797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,4,balanced,0.24366400639216104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,4,power_law_1.01,0.3036799907684326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,4,power_law_1.01,0.08183040022850037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,4,balanced,0.24819199244181314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,4,balanced,2.208693345387777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,4,power_law_1.01,0.3123775959014893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,4,power_law_1.01,0.1149440050125122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,4,balanced,0.2531306743621826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,4,power_law_1.01,0.1409152030944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,4,balanced,0.2601813276608785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,4,power_law_1.01,0.3351423978805542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,4,power_law_1.01,0.17605760097503662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,4,power_law_1.01,0.3419519901275635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,4,balanced,0.27290133635203045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,4,balanced,1.2745280265808105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,4,power_law_1.01,0.17411839962005615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,4,power_law_1.01,0.3500159978866577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,4,balanced,0.2817280093828837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,4,power_law_1.01,0.18586879968643188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,4,power_law_1.01,0.3714495897293091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,4,balanced,0.2940959930419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,4,power_law_1.01,0.18906879425048828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,4,power_law_1.01,0.4020671844482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,4,power_law_1.01,0.19896960258483887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,4,power_law_1.01,0.4159103870391846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,4,power_law_1.01,0.20510718822479249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,4,power_law_1.01,0.47696638107299805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,4,power_law_1.01,0.48200321197509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,4,balanced,0.3314080039660136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,4,power_law_1.01,0.21261439323425294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,4,balanced,1.6260426839192708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,4,power_law_1.01,0.5433407783508301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,4,power_law_1.01,0.2280639886856079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,4,power_law_1.01,0.5814208030700684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,4,power_law_1.01,0.2378688097000122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,4,power_law_1.01,0.7117311954498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,4,balanced,3.5107361475626626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,4,power_law_1.01,0.25384318828582764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,4,power_law_1.01,0.8111167907714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,4,power_law_1.01,0.2634176015853882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,4,power_law_1.01,1.0689151763916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,4,balanced,0.3962133328119914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,4,power_law_1.01,0.31220479011535646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,4,power_law_1.01,1.4061375617980958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,4,power_law_1.01,0.3191999912261963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,4,balanced,0.4845386743545532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,4,power_law_1.2,0.08531200289726257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,4,power_law_1.01,1.8848703384399415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,4,balanced,2.089845339457194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,4,power_law_1.01,0.3797760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,4,power_law_1.2,0.11365760564804077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,4,balanced,0.5373440186182658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,4,power_law_1.01,2.447225570678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,4,power_law_1.01,0.44626560211181643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,4,power_law_1.2,0.07650560140609741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,4,power_law_1.01,0.08065919876098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,4,power_law_1.01,2.8807296752929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,4,power_law_1.01,0.5624320030212402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,4,power_law_1.2,0.11689599752426147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,4,balanced,0.7237280209859213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,4,power_law_1.01,0.10153599977493286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,4,power_law_1.01,0.6494912147521973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,4,power_law_1.2,0.15678720474243163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,4,power_law_1.01,4.215046310424805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,4,power_law_1.01,0.08183040022850037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,4,power_law_1.01,0.873100757598877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,4,power_law_1.2,0.18869760036468505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,4,power_law_1.01,0.09644799828529357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,4,balanced,0.8496533234914144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,4,power_law_1.2,0.26625919342041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,4,power_law_1.01,8.387078094482423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,4,power_law_1.01,1.0808704376220704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,4,power_law_1.01,0.12055679559707641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,4,power_law_1.2,0.28971519470214846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,4,power_law_1.01,0.14797439575195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,4,power_law_1.01,1.5898688316345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,4,power_law_1.2,0.300435209274292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,4,power_law_1.01,0.17582720518112183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,4,balanced,1.286906639734904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,4,power_law_1.01,2.086841583251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,4,power_law_1.2,0.3034111976623535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,4,power_law_1.01,0.19774080514907838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,4,power_law_1.01,2.3528064727783202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,4,power_law_1.2,0.32120959758758544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,4,power_law_1.01,0.20119040012359618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,4,power_law_1.2,0.33203198909759524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,4,power_law_1.01,0.21162240505218505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,4,power_law_1.01,3.7223934173583983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,4,balanced,3.1644585927327475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,4,balanced,1.5638453165690105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,4,power_law_1.2,0.3422271966934204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,4,power_law_1.01,0.21920640468597413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,4,power_law_1.2,0.3573568105697632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,4,power_law_1.01,0.23944320678710937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,4,power_law_1.01,7.935116577148437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,4,power_law_1.2,0.38519039154052737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,4,power_law_1.01,0.2361920118331909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,4,power_law_1.01,0.25824000835418703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,4,power_law_1.2,0.4047743797302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,4,power_law_1.01,0.28421759605407715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,4,power_law_1.2,0.44406399726867674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,4,balanced,2.3140427271525064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,4,power_law_1.01,0.3092351913452148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,4,power_law_1.2,0.50862717628479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,4,balanced,7.023295720418294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,4,power_law_1.01,0.3470911979675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,4,power_law_1.2,0.5070847988128662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,4,power_law_1.2,0.5905792236328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,4,power_law_1.01,0.4173759937286377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,4,power_law_1.2,0.6201536178588867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,4,power_law_1.2,0.759065580368042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,4,power_law_1.01,0.4479487895965576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,4,balanced,3.0636374155680337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,4,power_law_1.2,0.9002431869506836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,4,power_law_1.01,0.5588863849639892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,4,power_law_1.2,1.209132766723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,4,power_law_1.01,0.6724736213684082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,4,power_law_1.2,1.5523520469665528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,4,power_law_1.01,0.8351103782653808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,4,power_law_1.2,1.857823944091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,4,power_law_1.01,1.0522496223449707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,4,power_law_1.2,2.5792640686035155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,4,power_law_1.01,1.4553919792175294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,4,power_law_1.2,3.1456512451171874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,4,power_law_1.01,2.0089855194091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,4,power_law_1.2,4.96648941040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,4,power_law_1.01,2.759052848815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,4,balanced,3.8207839330037436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,4,power_law_1.01,3.890227127075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,4,power_law_1.2,9.807206726074218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,4,balanced,6.252373377482097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,4,power_law_1.01,5.266124725341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,4,power_law_1.01,7.626636505126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,4,power_law_1.2,0.06487680077552796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,4,power_law_1.2,0.08354560136795045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,4,power_law_1.01,14.311616516113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,4,power_law_1.2,0.06130560040473938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,4,power_law_1.2,0.07905279994010925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,4,power_law_1.2,0.10180480480194092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,4,power_law_1.2,0.13005440235137938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,4,power_law_1.2,0.16010240316390992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,4,power_law_1.2,0.17419519424438476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,4,balanced,6.068480173746745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,4,power_law_1.2,0.17849600315093994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,4,power_law_1.2,0.18878719806671143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,4,power_law_1.2,0.19857280254364013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,4,power_law_1.2,0.21440000534057618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,4,power_law_1.2,0.2174976110458374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,4,power_law_1.2,0.22824320793151856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,4,power_law_1.2,0.2513472080230713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,4,power_law_1.2,0.25776000022888185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,4,power_law_1.2,0.2699264049530029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,4,power_law_1.2,0.31641600131988523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,4,power_law_1.2,0.3401535987854004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,4,power_law_1.2,0.41870718002319335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,4,power_law_1.2,0.49892477989196776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,4,power_law_1.2,0.6086912155151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,4,power_law_1.2,0.6555456161499024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,4,power_law_1.2,0.9331456184387207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,4,power_law_1.2,1.196723175048828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,4,power_law_1.2,1.6974527359008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,4,power_law_1.2,2.090777587890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,4,power_law_1.2,2.6966976165771483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,4,power_law_1.2,4.351430511474609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,4,power_law_1.2,8.64669418334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,4,balanced,12.15777587890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,4,power_law_1.2,0.08121600151062011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,4,power_law_1.2,0.09787520170211791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,4,power_law_1.2,0.0751039981842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,4,power_law_1.2,0.09370239973068237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,4,power_law_1.2,0.11404800415039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,4,power_law_1.2,0.13552000522613525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,2,balanced,0.05956799785296122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,4,power_law_1.2,0.18712960481643676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,2,balanced,0.06846933563550313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,2,balanced,0.05190933247407278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,4,power_law_1.2,0.1910912036895752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,2,balanced,0.08603733777999878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,4,power_law_1.2,0.1998975992202759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,2,balanced,0.05663466453552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,2,balanced,0.1329813301563263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,2,balanced,0.21688532829284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,2,balanced,0.06900799771149953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,4,power_law_1.2,0.20924160480499268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,2,balanced,0.38282668590545654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,2,balanced,0.09920000036557515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,4,power_law_1.2,0.21943039894104005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,2,balanced,0.38513068358103436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,2,balanced,0.148799995581309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,4,power_law_1.2,0.2316864013671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,2,balanced,0.24409600098927817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,2,balanced,0.3877120018005371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,4,power_law_1.2,0.2491391897201538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,2,balanced,0.24830400943756104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,2,balanced,0.3911679983139038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,2,balanced,0.24990934133529663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,4,power_law_1.2,0.26626560688018797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,2,balanced,0.39133866628011066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,2,balanced,0.2542826731999715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,4,power_law_1.2,0.29687039852142333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,2,balanced,0.39265600840250653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,2,balanced,0.2563093304634094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,4,power_law_1.2,0.3203007936477661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,2,balanced,0.39764801661173504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,2,balanced,0.26131733258565265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,4,power_law_1.2,0.3598975896835327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,2,balanced,0.3989866574605306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,2,balanced,0.2672106623649597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,2,balanced,0.40955201784769696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,2,balanced,0.2720213333765666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,2,balanced,0.4192053476969401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,2,balanced,0.2766079902648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,4,power_law_1.2,0.4209472179412842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,2,balanced,0.2911626696586609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,2,balanced,0.4240320126215617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,2,balanced,0.29578665892283124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,2,balanced,0.44444799423217773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,4,power_law_1.2,0.4729919910430908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,2,balanced,0.3128640055656433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,2,balanced,0.4731680154800415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,4,power_law_1.2,0.6043200016021728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,2,balanced,0.3383839925130208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,2,power_law_1.01,0.06591359972953796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,2,balanced,0.5045173168182373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,4,power_law_1.2,0.6982143878936767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,2,balanced,0.38413333892822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,4,power_law_1.2,0.9061440467834473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,2,balanced,0.5623573462168375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,2,power_law_1.01,0.08321279883384705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,4,power_law_1.2,1.312166404724121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,2,power_law_1.01,0.07124480009078979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,2,balanced,0.44760000705718994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,2,balanced,0.6423146724700928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,2,power_law_1.01,0.11109119653701782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,4,power_law_1.2,1.6599552154541015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,2,power_law_1.01,0.166758394241333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,2,balanced,0.4821919997533162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,2,balanced,0.08084799846013387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,4,power_law_1.2,2.168409538269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,2,power_law_1.01,0.21095681190490723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,2,balanced,0.7411786715189616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,2,power_law_1.01,0.05589759945869446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,2,power_law_1.01,0.2708159923553467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,2,balanced,0.08690133690834045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,4,power_law_1.2,3.2660545349121093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,2,balanced,0.5993813276290894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,2,power_law_1.01,0.2905535936355591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,2,power_law_1.01,0.06719359755516052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,2,balanced,0.09698133667310078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,2,power_law_1.01,0.3043071985244751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,2,balanced,0.849455992380778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,4,power_law_1.2,3.806284713745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,2,balanced,0.1265066663424174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,2,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,2,power_law_1.01,0.3162175893783569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,2,balanced,0.18140800793965658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,2,power_law_1.01,0.08968960046768189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,2,balanced,0.7234559853871664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,2,power_law_1.01,0.3355711936950684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,4,power_law_1.2,5.1245887756347654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,2,balanced,0.27632532517115277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,2,power_law_1.01,0.35647358894348147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,2,power_law_1.01,0.11611520051956177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,2,balanced,0.2836373249689738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,2,power_law_1.01,0.36708478927612304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,2,balanced,1.1331626574198406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,4,power_law_1.2,8.415513610839843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,2,power_law_1.01,0.14584319591522216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,2,power_law_1.01,0.3811327934265137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,2,balanced,0.2893226742744446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,2,power_law_1.01,0.18240640163421631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,2,power_law_1.01,0.4036736011505127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,2,balanced,1.0173973242441814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,2,balanced,0.28958932558695477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,2,power_law_1.01,0.19128960371017456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,2,power_law_1.01,0.447219181060791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,2,balanced,0.2946453293164571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,4,power_law_1.2,19.192658996582033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,2,power_law_1.01,0.43749117851257324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,2,power_law_1.01,0.2052544116973877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,2,balanced,0.3004960020383199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,2,power_law_1.01,0.5154816150665283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,2,balanced,1.3857547442118328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,2,power_law_1.01,0.2092672109603882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,2,balanced,0.31037867069244385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,2,power_law_1.01,0.5564735889434814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,2,power_law_1.01,0.22188799381256102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,2,balanced,0.31894399722417194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,2,power_law_1.01,0.6429632186889649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,2,balanced,1.2834400335947673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,2,power_law_1.01,0.700767993927002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,2,power_law_1.01,0.2396224021911621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,2,balanced,0.328874667485555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,2,power_law_1.01,0.8433024406433105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,2,power_law_1.01,0.24004480838775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,2,balanced,0.34676798184712726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,2,power_law_1.01,0.9585344314575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,2,power_law_1.01,0.2670720100402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,2,balanced,0.3601866563161214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,2,power_law_1.01,1.2467647552490235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,2,balanced,1.9507253964742024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,2,power_law_1.01,0.2828160047531128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,2,power_law_1.01,1.540384006500244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,2,balanced,0.3866506814956665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,2,power_law_1.01,0.3038464069366455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,2,power_law_1.01,2.2198463439941407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,2,balanced,1.8548906644185383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,2,power_law_1.01,2.7801984786987304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,2,power_law_1.01,0.3065727949142456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,2,power_law_1.01,0.3555327892303467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,2,power_law_1.01,3.5423233032226564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,2,power_law_1.01,0.3934783935546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,2,balanced,0.4798080126444499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,2,power_law_1.01,5.649766540527343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,2,power_law_1.01,0.48267521858215334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,2,power_law_1.01,0.5196991920471191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,2,power_law_1.01,10.771526336669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,2,balanced,2.46834135055542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,2,power_law_1.01,0.6570816040039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,2,power_law_1.01,0.7809279918670654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,2,power_law_1.01,0.08486400246620178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,2,balanced,2.311957359313965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,2,power_law_1.01,1.089023971557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,2,power_law_1.01,0.09690240025520325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,2,power_law_1.01,1.4157567977905274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,2,balanced,0.5935253302256266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,2,power_law_1.01,0.10217599868774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,2,power_law_1.01,1.9147327423095704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,2,balanced,0.7395466963450114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,2,power_law_1.01,0.11509120464324951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,2,power_law_1.01,2.5104448318481447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,2,power_law_1.2,0.06673280000686646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,2,power_law_1.01,0.1519487977027893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,2,power_law_1.01,3.0991615295410155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,2,balanced,0.8205866813659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,2,power_law_1.2,0.07979519963264466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,2,power_law_1.01,0.17941759824752807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,2,balanced,3.2142772674560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,2,power_law_1.2,0.0735360026359558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,2,power_law_1.01,0.21728639602661132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,2,power_law_1.01,4.906521606445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,2,power_law_1.01,0.23495678901672362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,2,power_law_1.2,0.10598399639129638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,2,balanced,1.174570639928182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,2,balanced,3.018687884012858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,2,power_law_1.01,0.23877758979797364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,2,power_law_1.2,0.1518847942352295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,2,power_law_1.01,10.013247680664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,2,power_law_1.2,0.18519680500030516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,2,power_law_1.01,0.24940159320831298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,2,balanced,1.4030772844950359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,2,power_law_1.2,0.2705215930938721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,2,power_law_1.01,0.2665535926818848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,2,power_law_1.2,0.2973504066467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,2,power_law_1.01,0.28517119884490966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,2,power_law_1.2,0.30318078994750974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,2,power_law_1.01,0.30383360385894775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,2,balanced,2.1858506202697754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,2,power_law_1.2,0.3161535978317261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,2,power_law_1.01,0.3377408027648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,2,power_law_1.01,0.37173759937286377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,2,power_law_1.2,0.33879680633544923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,2,power_law_1.01,0.3960319995880127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,2,power_law_1.2,0.3652031898498535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,2,power_law_1.01,0.45569920539855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,2,balanced,2.6865228017171225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,2,power_law_1.2,0.3637439966201782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,2,balanced,4.773802757263184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,2,power_law_1.2,0.38840320110321047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,2,power_law_1.2,0.4211264133453369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,2,power_law_1.01,0.5645887851715088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,2,power_law_1.2,0.46924800872802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,2,balanced,4.499754587809245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,2,power_law_1.2,0.46491518020629885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,2,power_law_1.01,0.6362815856933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,2,balanced,3.929343859354655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,2,power_law_1.2,0.5320256233215332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,2,power_law_1.01,0.7955840110778809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,2,power_law_1.2,0.5646207809448243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,2,power_law_1.01,0.9776703834533691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,2,power_law_1.2,0.6806272029876709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,2,power_law_1.01,1.294809627532959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,2,power_law_1.2,0.728326416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,2,power_law_1.01,1.6572736740112304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,2,power_law_1.2,0.8875136375427246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,2,power_law_1.01,2.3865535736083983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,2,power_law_1.2,1.0225728034973145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,2,balanced,5.1669918696085615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,2,power_law_1.2,1.279539203643799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,2,power_law_1.01,3.094611167907715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,2,power_law_1.2,1.626848030090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,2,power_law_1.01,4.1299903869628904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,2,power_law_1.2,2.3056447982788084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,2,power_law_1.01,5.985868835449219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,2,power_law_1.2,3.033683204650879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,2,power_law_1.01,6.89916763305664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,2,power_law_1.2,3.623513412475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,2,power_law_1.01,11.240166473388673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,2,power_law_1.2,5.927628707885742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,2,balanced,6.3972320556640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,2,power_law_1.2,11.59815673828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,2,power_law_1.01,21.68642578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,2,balanced,9.385818481445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,2,balanced,8.87390391031901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,2,balanced,10.2008908589681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,2,power_law_1.2,0.05556480288505554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,2,power_law_1.2,0.06575359702110291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,2,power_law_1.2,0.061273598670959474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,2,power_law_1.2,0.08439040184020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,2,power_law_1.2,0.10931199789047241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,2,power_law_1.2,0.1299072027206421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,2,power_law_1.2,0.18202240467071534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,2,power_law_1.2,0.1887488007545471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,2,power_law_1.2,0.2035775899887085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,2,power_law_1.2,0.2028736114501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,2,power_law_1.2,0.22323839664459227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,2,power_law_1.2,0.23615360260009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,2,power_law_1.2,0.24971520900726318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,2,power_law_1.2,0.08479999899864196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,2,power_law_1.2,0.2707904100418091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,2,power_law_1.2,0.2960959911346436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,2,power_law_1.2,0.09639679789543151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,2,power_law_1.2,0.3132031917572021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,2,power_law_1.2,0.09627519845962525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,2,power_law_1.2,0.31152000427246096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,2,power_law_1.2,0.10759040117263793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,2,power_law_1.2,0.36613759994506834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,2,power_law_1.2,0.1366719961166382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,2,power_law_1.2,0.4137983798980713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,2,power_law_1.2,0.16227200031280517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,2,power_law_1.2,0.21397120952606202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,2,power_law_1.2,0.49704318046569823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,2,balanced,20.353621164957683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,2,power_law_1.2,0.22878720760345458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,2,power_law_1.2,0.5499839782714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,2,power_law_1.2,0.23914880752563478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,2,power_law_1.2,0.7082240104675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,2,power_law_1.2,0.26051840782165525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,1,balanced,0.0735093355178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,2,power_law_1.2,0.838809585571289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,2,power_law_1.2,0.2747584104537964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,2,power_law_1.2,1.1373760223388671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,1,balanced,0.07331199944019318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,2,power_law_1.2,0.29141759872436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,1,balanced,0.09416533509890239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,2,power_law_1.2,1.4128640174865723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,2,power_law_1.2,0.3053951978683472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,1,balanced,0.1486293375492096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,2,power_law_1.2,2.005625534057617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,2,power_law_1.2,0.34114561080932615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,1,balanced,0.245253324508667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,2,power_law_1.2,0.37325439453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,2,power_law_1.2,2.5504512786865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,2,power_law_1.2,0.39920639991760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,1,balanced,0.43915732701619464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,2,power_law_1.2,3.3437374114990233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,2,power_law_1.2,0.4508927822113037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,1,balanced,0.4439786672592163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,1,balanced,0.43785067399342853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,2,power_law_1.2,4.9783935546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,2,power_law_1.2,0.58919677734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,1,balanced,0.44069333871205646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,1,balanced,0.43953601519266766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,2,power_law_1.2,9.850316619873047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,1,balanced,0.4432320197423299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,2,power_law_1.2,0.645747184753418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,1,balanced,0.4508320093154907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,1,balanced,0.4542773167292277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,2,power_law_1.2,0.8288640022277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,1,balanced,0.461082657178243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,2,power_law_1.2,0.9769727706909179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,1,balanced,0.4711093505223592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,2,power_law_1.2,1.3160256385803222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,1,balanced,0.47781864802042645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,1,balanced,0.493008017539978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,2,power_law_1.2,1.8026304244995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,1,balanced,0.5566933155059814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,2,power_law_1.2,2.494700813293457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,1,balanced,0.6299093166987101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,2,power_law_1.2,3.381062316894531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,1,balanced,0.726143995920817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,2,power_law_1.2,4.666067123413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,1,balanced,0.7936053276062012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,2,power_law_1.2,6.208134460449219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,2,power_law_1.2,7.2694847106933596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,1,balanced,1.0064480304718018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,2,power_law_1.2,12.2412353515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,1,balanced,1.2535786628723145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,2,power_law_1.2,24.6876220703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,1,balanced,1.7668320337931316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,1,balanced,2.206826686859131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,1,balanced,0.05769066512584686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,1,balanced,0.06301333506902058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,1,power_law_1.01,0.07036160230636597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,1,balanced,3.195237477620443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,1,balanced,0.08107199768225352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,1,power_law_1.01,0.07025920152664185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,1,balanced,0.11774933338165283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,1,power_law_1.01,0.078438401222229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,1,balanced,0.18292800585428873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,1,power_law_1.01,0.053395199775695804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,1,power_law_1.01,0.12673280239105225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,1,balanced,0.12372266252835591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,1,balanced,0.3104853431383769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,1,power_law_1.01,0.06056320071220398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,1,power_law_1.01,0.17964160442352295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,1,balanced,0.13269333044687906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,1,balanced,0.31463466087977093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,1,power_law_1.01,0.06540799736976624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,1,power_law_1.01,0.2261375904083252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,1,balanced,0.1470080018043518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,1,balanced,0.3147040009498596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,1,power_law_1.01,0.09976320266723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,1,balanced,0.17885865767796835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,1,power_law_1.01,0.31604480743408203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,1,balanced,0.3181920051574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,1,balanced,3.9361279805501304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,1,balanced,0.24574933449427286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,1,power_law_1.01,0.1354688048362732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,1,balanced,0.32052799065907794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,1,power_law_1.01,0.33729920387268064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,1,balanced,0.3757760127385457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,1,power_law_1.01,0.17272959947586058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,1,balanced,0.32464534044265747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,1,power_law_1.01,0.3452608108520508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,1,balanced,0.39071468512217206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,1,power_law_1.01,0.2304896116256714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,1,balanced,0.33127466837565106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,1,power_law_1.01,0.3540800094604492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,1,balanced,0.40220268567403156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,1,power_law_1.01,0.23844480514526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,1,balanced,0.33763734499613446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,1,power_law_1.01,0.37817599773406985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,1,balanced,0.40886934598286945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,1,power_law_1.01,0.2551104068756104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,1,balanced,0.3455306688944499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,1,balanced,0.4079306523005168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,1,power_law_1.01,0.38842880725860596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,1,power_law_1.01,0.2616384029388428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,1,balanced,0.3567359844843547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,1,balanced,0.4229653278986613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,1,power_law_1.01,0.3971328020095825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,1,power_law_1.01,0.2780416011810303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,1,balanced,0.4386933247248332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,1,balanced,0.36529068152109784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,1,power_law_1.01,0.4196800231933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,1,power_law_1.01,0.30171520709991456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,1,balanced,5.166229248046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,1,balanced,0.45209066073099774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,1,balanced,0.39238933722178143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,1,power_law_1.01,0.4469247817993164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,1,power_law_1.01,0.30801279544830323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,1,balanced,0.47783998648325604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,1,balanced,0.45421334107716876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,1,power_law_1.01,0.46846718788146974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,1,power_law_1.01,0.3416960000991821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,1,balanced,0.5264106591542562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,1,power_law_1.01,0.5033279895782471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,1,balanced,0.5230186780293783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,1,power_law_1.01,0.3706367969512939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,1,balanced,0.5642240047454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,1,power_law_1.01,0.6189760208129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,1,power_law_1.01,0.3958271980285645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,1,balanced,0.5999253193537394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,1,balanced,0.5998080174128214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,1,power_law_1.01,0.6755839824676514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,1,power_law_1.01,0.4004096031188965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,1,balanced,0.6781973044077555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,1,power_law_1.01,0.8042752265930175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,1,power_law_1.01,0.48604798316955566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,1,power_law_1.01,0.9275648117065429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,1,power_law_1.01,0.5296576023101807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,1,balanced,0.9020799795786539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,1,balanced,0.7541066805521647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,1,power_law_1.01,0.6326015949249267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,1,power_law_1.01,1.1710016250610351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,1,power_law_1.01,0.7338111877441407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,1,power_law_1.01,1.371833610534668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,1,balanced,1.1169119675954182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,1,power_law_1.01,0.9348992347717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,1,power_law_1.01,1.8997888565063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,1,power_law_1.01,1.161689567565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,1,power_law_1.01,2.2227264404296876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,1,balanced,7.394245147705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,1,power_law_1.01,1.5915583610534667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,1,power_law_1.01,3.1597055435180663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,1,balanced,0.9624853134155273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,1,balanced,1.6088372866312664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,1,power_law_1.01,2.0372735977172853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,1,power_law_1.01,4.021017456054688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,1,balanced,1.233514706293742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,1,power_law_1.01,2.9293119430541994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,1,power_law_1.01,4.901542282104492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,1,balanced,1.3865440686543782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,1,power_law_1.01,0.1095039963722229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,1,power_law_1.01,3.7547073364257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,1,balanced,2.0789119402567544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,1,power_law_1.01,7.464530944824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,1,power_law_1.01,0.1183616042137146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,1,power_law_1.01,4.5820671081542965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,1,balanced,2.0450612703959146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,1,power_law_1.01,0.13742079734802246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,1,power_law_1.01,7.064902496337891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,1,power_law_1.01,14.56759033203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,1,power_law_1.01,0.16412800550460815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,1,balanced,2.4595786730448403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,1,power_law_1.01,0.20531840324401857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,1,power_law_1.01,13.861042785644532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,1,power_law_1.01,0.24260480403900148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,1,balanced,3.0381387074788413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,1,power_law_1.01,0.304915189743042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,1,balanced,3.8363574345906577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,1,power_law_1.01,0.3256448030471802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,1,power_law_1.01,0.33879680633544923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,1,power_law_1.01,0.3464576005935669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,1,power_law_1.2,0.07030400037765502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,1,power_law_1.01,0.3818367958068848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,1,balanced,4.7547041575113935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,1,power_law_1.2,0.07039999961853027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,1,power_law_1.01,0.4035967826843262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,1,balanced,3.7178452809651694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,1,power_law_1.2,0.07738879919052125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,1,power_law_1.01,0.423308801651001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,1,power_law_1.2,0.11940480470657348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,1,power_law_1.01,0.4787007808685303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,1,power_law_1.2,0.1530303955078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,1,power_law_1.01,0.533574390411377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,1,power_law_1.2,0.20777599811553954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,1,balanced,7.064837137858073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,1,power_law_1.2,0.30373120307922363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,1,power_law_1.01,0.5839295864105225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,1,power_law_1.2,0.3285887956619263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,1,power_law_1.01,0.6860799789428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,1,power_law_1.2,0.337228798866272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,1,power_law_1.2,0.3589951992034912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,1,balanced,14.525360107421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,1,balanced,4.908672014872233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,1,power_law_1.01,0.8592255592346192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,1,power_law_1.2,0.3701247930526733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,1,power_law_1.2,0.3981568098068237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,1,power_law_1.2,0.4087039947509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.01,0.961945629119873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,1,balanced,9.354917526245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,1,power_law_1.2,0.053414398431777955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,1,power_law_1.2,0.4324480056762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.01,1.2591039657592773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,1,power_law_1.2,0.060652798414230345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,1,power_law_1.2,0.4601856231689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,1,power_law_1.2,0.06776319742202759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.01,1.562828826904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,1,power_law_1.2,0.09329919815063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,1,power_law_1.2,0.47275519371032715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,1,power_law_1.2,0.12195199728012085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.01,2.1431552886962892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,1,power_law_1.2,0.5322303771972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,1,power_law_1.2,0.157478404045105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.01,2.6881088256835937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,1,power_law_1.2,0.227020788192749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,1,power_law_1.2,0.6379007816314697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,1,power_law_1.2,0.23821439743041992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,1,power_law_1.2,0.6930880069732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.01,3.831430435180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,1,power_law_1.2,0.24741120338439943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,1,power_law_1.2,0.25729920864105227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,1,power_law_1.2,0.8207039833068848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.01,4.96569595336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,1,balanced,11.66385014851888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,1,power_law_1.2,0.28012800216674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,1,power_law_1.2,0.9469375610351562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,1,power_law_1.2,0.3045120000839233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,1,balanced,7.0868479410807295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.01,7.2430274963378904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,1,power_law_1.2,0.3144320011138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,1,power_law_1.2,1.1725119590759276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,1,power_law_1.2,0.3454463958740234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,1,power_law_1.2,1.4236736297607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.01,9.49411849975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,1,power_law_1.2,0.3747391939163208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,1,power_law_1.2,1.9479488372802733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,1,power_law_1.2,0.4020864009857178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,1,power_law_1.2,0.4205632209777832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,1,power_law_1.01,11.764044952392577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,1,power_law_1.2,2.2694400787353515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,1,power_law_1.2,0.49413118362426756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,1,power_law_1.2,0.5507008075714112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,1,power_law_1.2,3.1806463241577148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,1,power_law_1.2,0.6513855934143067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,1,power_law_1.01,18.559756469726562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,1,power_law_1.2,0.7567808151245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,1,power_law_1.2,4.055193710327148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,1,power_law_1.2,0.9746047973632812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,1,power_law_1.2,5.079840087890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,1,power_law_1.2,1.1769856452941894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,1,power_law_1.2,1.618943977355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,1,power_law_1.01,36.710446166992185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,1,power_law_1.2,2.067462348937988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,1,power_law_1.2,7.499212646484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,1,power_law_1.2,2.97326717376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,1,balanced,18.446735382080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,1,power_law_1.2,3.7921791076660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,1,power_law_1.2,14.57073974609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,1,power_law_1.2,4.701395034790039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,1,power_law_1.2,7.074758148193359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,1,power_law_1.2,13.851834106445313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,1,balanced,13.857130686442057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,1,balanced,36.70845286051432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,1,power_law_1.2,0.10976639986038209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,1,power_law_1.2,0.11800960302352906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,1,power_law_1.2,0.1368831992149353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,16,balanced,0.02476799984773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,1,power_law_1.2,0.16134400367736818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,16,balanced,0.025013332565625507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,1,power_law_1.2,0.18652160167694093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,16,balanced,0.025685332715511322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,1,power_law_1.2,0.2236543893814087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,16,balanced,0.029498666524887085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,1,power_law_1.2,0.3021183967590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,16,balanced,0.04497600098450979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,1,power_law_1.2,0.314355206489563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,16,balanced,0.046256000796953835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,16,balanced,0.046666666865348816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,1,power_law_1.2,0.3343744039535522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,16,balanced,0.04620266457398733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,1,power_law_1.2,0.34603519439697267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,16,balanced,0.04656533400217692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,1,power_law_1.2,0.3761791944503784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,16,balanced,0.046821330984433494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,1,power_law_1.2,0.41371521949768064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,16,balanced,0.047322665651639305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,1,power_law_1.2,0.4300032138824463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,16,balanced,0.048485333720842995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,1,power_law_1.2,0.4804224014282227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,16,balanced,0.04926399886608124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,16,balanced,0.049839998284975685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,1,power_law_1.2,0.5435328006744384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,16,balanced,0.05392000079154968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,16,balanced,0.03002133220434189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,1,power_law_1.2,0.599123191833496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,16,balanced,0.055125330885251365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,16,balanced,0.029818666477998097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,1,power_law_1.2,0.6862656116485596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,16,balanced,0.05681600173314413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,16,balanced,0.03224000086386999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,16,balanced,0.033471999069054924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,16,balanced,0.05811200042565664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,1,power_law_1.2,0.8696895599365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,16,balanced,0.035589332381884255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,16,balanced,0.06172266602516174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,16,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,16,balanced,0.03669866671164831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,16,balanced,0.06343466540177663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,16,balanced,0.036490666369597115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.2,0.9737471580505371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,16,balanced,0.03665599972009659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.2,1.2747200012207032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,16,balanced,0.07035733262697856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,16,balanced,0.03765333443880081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.2,1.5658047676086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,16,balanced,0.03734933336575826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,16,balanced,0.037690666814645134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,16,balanced,0.08222400148709615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.2,2.163295936584473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,16,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,16,balanced,0.04045866678158442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.2,2.7081087112426756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,16,balanced,0.04411733150482178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,16,balanced,0.08702400326728821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.2,3.8296321868896483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,16,balanced,0.042634665966033936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,16,balanced,0.04739200075467428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.2,4.954771041870117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,16,balanced,0.05093866586685181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,16,balanced,0.12313600381215413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.2,7.237638092041015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,16,balanced,0.05714133381843567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.2,9.485842895507812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,16,balanced,0.06286933521429698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,16,balanced,0.0719413310289383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,1,power_law_1.2,11.762067413330078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,16,balanced,0.13875733812650046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,16,balanced,0.08628799517949422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,1,power_law_1.2,18.538284301757812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,16,balanced,0.09676266709963481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,16,balanced,0.18929066260655722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,1,power_law_1.2,36.646539306640626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,16,balanced,0.13192533453305563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,16,balanced,0.024458666642506916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,16,power_law_1.01,0.041657599806785586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,16,power_law_1.01,0.03950079977512359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,16,balanced,0.024608001112937927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,16,power_law_1.01,0.03560959994792938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,16,balanced,0.02500266581773758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,16,power_law_1.01,0.028147199749946596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,16,power_law_1.01,0.03425920009613037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,16,balanced,0.15426666537920633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,16,balanced,0.02699733277161916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,16,power_law_1.01,0.03485440015792847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,16,power_law_1.01,0.03282560110092163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,16,balanced,0.029648000995318096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,16,power_law_1.01,0.03769600093364715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,16,balanced,0.2149440050125122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,16,power_law_1.01,0.033004799485206605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,16,balanced,0.03091199944416682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,16,power_law_1.01,0.043884798884391785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,16,power_law_1.01,0.034745600819587705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,16,balanced,0.030784000953038532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,16,power_law_1.01,0.044563201069831845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,16,power_law_1.01,0.03603839874267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,16,balanced,0.030794667700926464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,16,power_law_1.01,0.0457152009010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,16,power_law_1.01,0.036160001158714296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,16,balanced,0.2153759996096293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,16,balanced,0.030778666337331135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,16,power_law_1.01,0.02932479977607727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,16,power_law_1.01,0.049209600687026976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,16,power_law_1.01,0.037990400195121767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,16,balanced,0.03172266731659571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,16,power_law_1.01,0.049318400025367734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,16,power_law_1.01,0.03925119936466217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,16,power_law_1.01,0.026745599508285523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,16,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,16,power_law_1.01,0.04118399918079376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,16,power_law_1.01,0.049542400240898135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,16,power_law_1.01,0.026188799738883974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,16,balanced,0.03290133426586787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,16,power_law_1.01,0.052249598503112796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,16,power_law_1.01,0.04289920032024384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,16,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,16,balanced,0.03358400116364161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,16,balanced,0.26683733860651654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,16,power_law_1.01,0.046054399013519286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,16,power_law_1.01,0.05127679705619812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,16,power_law_1.01,0.02911359965801239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,16,balanced,0.033626665671666466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,16,power_law_1.01,0.046419200301170346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,16,power_law_1.01,0.43319039344787597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,16,power_law_1.01,0.03080959916114807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,16,power_law_1.01,0.04818559885025024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,16,balanced,0.2669653296470642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,16,power_law_1.01,0.43476481437683107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,16,power_law_1.01,0.031206399202346802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,16,power_law_1.01,0.053235197067260744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,16,power_law_1.01,0.4382016181945801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,16,power_law_1.01,0.032051199674606325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,16,power_law_1.01,0.05507199764251709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,16,balanced,0.03940266619126002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,16,power_law_1.01,0.0654591977596283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,16,power_law_1.01,0.034457600116729735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,16,power_law_1.01,0.058329600095748904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,16,balanced,0.04002666721741358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,16,power_law_1.2,0.039577600359916684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,16,power_law_1.01,0.07138559818267823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,16,power_law_1.01,0.035743999481201175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,16,power_law_1.01,0.0644864022731781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,16,power_law_1.2,0.02754560112953186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,16,power_law_1.01,0.07994880080223084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,16,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,16,power_law_1.01,0.07320320010185241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,16,power_law_1.2,0.028435200452804565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,16,power_law_1.01,0.08835840225219727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,16,power_law_1.01,0.08229759931564332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,16,power_law_1.01,0.04079360067844391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,16,power_law_1.2,0.030956798791885377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,16,power_law_1.2,0.0383296012878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,16,power_law_1.01,0.10190080404281616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,16,power_law_1.01,0.09915519952774048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,16,power_law_1.01,0.044512000679969785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,16,power_law_1.2,0.044172799587249754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,16,power_law_1.01,0.04712960124015808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,16,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,16,power_law_1.01,0.12368639707565307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,16,power_law_1.01,0.13824000358581542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,16,balanced,0.3288693428039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,16,balanced,0.04348266621430715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,16,power_law_1.2,0.04696959853172302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,16,power_law_1.01,0.1413632035255432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,16,power_law_1.01,0.15364480018615723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,16,power_law_1.2,0.04844799935817719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,16,balanced,0.05014933149019877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,16,power_law_1.2,0.048556798696517946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,16,balanced,0.3983999888102214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,16,power_law_1.01,0.1906559944152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,16,power_law_1.01,0.22760319709777832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,16,power_law_1.01,0.0514240026473999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,16,power_law_1.2,0.04961279928684235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,16,balanced,0.050570666790008545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,16,power_law_1.01,0.2377023935317993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,16,power_law_1.2,0.05229439735412598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,16,power_law_1.01,0.26730880737304685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,16,power_law_1.01,0.05497599840164184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,16,power_law_1.2,0.05307520031929016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,16,power_law_1.01,0.37465600967407225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,16,power_law_1.01,0.32179200649261475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,16,power_law_1.2,0.43011841773986814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,16,power_law_1.01,0.4615231990814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,16,power_law_1.2,0.43048958778381347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,16,power_law_1.01,0.41008639335632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,16,power_law_1.01,0.05803520083427429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,16,power_law_1.2,0.43656320571899415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,16,power_law_1.01,0.5906303882598877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,16,power_law_1.2,0.06726400256156921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,16,power_law_1.01,0.6058815956115723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,16,balanced,0.06408533453941345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,16,power_law_1.01,0.0705024003982544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,16,power_law_1.2,0.0754688024520874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,16,power_law_1.01,1.0263615608215333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,16,power_law_1.01,0.08332160115242004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,16,power_law_1.2,0.08461440205574036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,16,power_law_1.01,0.8121408462524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,16,balanced,0.06974400083223979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,16,power_law_1.2,0.09533439874649048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,16,power_law_1.01,2.0674560546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,16,power_law_1.2,0.12019840478897095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,16,power_law_1.01,1.5486463546752929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,16,power_law_1.01,0.09275519847869873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,16,power_law_1.2,0.1410752058029175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,16,balanced,0.09131200114885966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,16,power_law_1.2,0.18657920360565186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,16,power_law_1.01,0.10577919483184814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,16,power_law_1.2,0.2250368118286133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,16,power_law_1.01,0.1365504026412964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,16,balanced,0.5058613220850626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,16,power_law_1.2,0.2910016059875488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,16,balanced,0.10308266679445903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,16,power_law_1.2,0.49683198928833006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,16,power_law_1.01,0.16949119567871093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,16,power_law_1.2,0.6815743923187256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,16,power_law_1.01,0.30779519081115725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,16,power_law_1.2,0.7531392097473144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,16,power_law_1.01,0.3714047908782959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,16,power_law_1.2,1.3736000061035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,16,balanced,0.13850133617719015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,16,power_law_1.2,3.6296512603759767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,16,power_law_1.01,0.5340415954589843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,16,balanced,0.17257066567738852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,16,power_law_1.01,0.7726975917816162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,16,power_law_1.01,1.0149375915527343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,16,power_law_1.01,1.3831104278564452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,16,power_law_1.01,3.048953628540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,16,balanced,0.7494080066680908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,16,balanced,0.2577280004819234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,16,balanced,0.34114666779836017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,16,balanced,0.9565119743347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,16,balanced,0.43114133675893146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,16,power_law_1.2,0.039392000436782836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,16,power_law_1.2,0.033395200967788696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,16,power_law_1.2,0.03289600014686585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,16,power_law_1.2,0.03260799944400787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,16,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,16,power_law_1.2,0.036601600050926206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,16,power_law_1.2,0.036595198512077334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,16,power_law_1.2,0.03857280015945434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,16,power_law_1.2,0.03982079923152924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,16,balanced,0.6698453426361084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,16,power_law_1.2,0.04170880019664765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,16,power_law_1.2,0.04483200013637543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,16,power_law_1.2,0.04607360064983368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,16,power_law_1.2,0.04728319942951202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,16,power_law_1.2,0.04948480129241943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,16,power_law_1.2,0.05470719933509827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,16,power_law_1.2,0.05731199979782105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,16,power_law_1.2,0.059910398721694944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,16,power_law_1.2,0.06656640172004699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,16,power_law_1.2,0.07596799731254578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,16,power_law_1.2,0.09408000111579895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,16,power_law_1.2,0.11944320201873779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,16,power_law_1.2,0.14154239892959594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,16,power_law_1.2,0.1900223970413208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,16,power_law_1.2,0.26053121089935305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,16,power_law_1.2,0.2873408079147339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,16,power_law_1.2,0.4164095878601074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,16,power_law_1.2,0.6389440059661865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,16,power_law_1.2,0.9290304183959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,16,power_law_1.2,1.3914752006530762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,16,power_law_1.2,2.9929792404174806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,16,balanced,1.3109333515167236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,16,power_law_1.2,0.028960001468658448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,16,power_law_1.2,0.026169601082801818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,16,power_law_1.2,0.025913599133491515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,16,power_law_1.2,0.02826879918575287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,16,power_law_1.2,0.028652799129486085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,16,power_law_1.2,0.030880001187324525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,8,balanced,0.03072533259789149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,8,balanced,0.02298133323589961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,16,power_law_1.2,0.03125759959220886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,8,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,16,power_law_1.2,0.033107200264930726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,8,balanced,0.02332799881696701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,8,balanced,0.030954666435718536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,16,power_law_1.2,0.03443840146064758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,8,balanced,0.024304000039895374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,16,power_law_1.2,0.036364799737930296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,8,balanced,0.03357866654793421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,8,balanced,0.02870933214823405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,16,power_law_1.2,0.040268799662590025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,8,balanced,0.03763733307520548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,8,balanced,0.04018666595220566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,16,power_law_1.2,0.04188160002231598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,8,balanced,0.038218667109807335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,8,balanced,0.04218666752179464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,16,power_law_1.2,0.04312959909439087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,8,balanced,0.04427733520666758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,16,power_law_1.2,0.04938240051269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,8,balanced,0.03862400104602178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,8,balanced,0.04277333120505015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,8,balanced,0.03810133288304011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,8,balanced,0.04188799858093262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,8,balanced,0.038389332592487335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,16,power_law_1.2,0.054176002740859985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,8,balanced,0.03862400104602178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,8,balanced,0.042405332128206887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,16,power_law_1.2,0.05740799903869629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,8,balanced,0.03915199885765711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,8,balanced,0.0429013321797053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,8,balanced,0.04390400151411692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,8,balanced,0.03913066784540812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,16,power_law_1.2,0.062003201246261595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,8,balanced,0.03997333347797394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,8,balanced,0.04475200176239014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,16,power_law_1.2,0.07310720086097718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,16,power_law_1.2,0.08375040292739869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,8,balanced,0.041050667564074196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,8,balanced,0.04566933214664459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,8,balanced,0.04554666578769684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,8,balanced,0.049914668003718056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,16,power_law_1.2,0.10357760190963745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,16,power_law_1.2,0.13521920442581176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,8,balanced,0.04576000074545542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,8,balanced,0.0498879998922348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,16,power_law_1.2,0.1937407970428467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,8,power_law_1.01,0.027219200134277345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,8,balanced,0.04986133178075155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,8,balanced,0.05741333464781443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,16,power_law_1.2,0.2224639892578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,8,power_law_1.01,0.027833598852157592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,16,power_law_1.2,0.33974399566650393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,8,balanced,0.05435200035572052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,8,balanced,0.06107200185457865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,8,power_law_1.01,0.02651520073413849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,16,power_law_1.2,0.5082623958587646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,8,power_law_1.01,0.030559998750686646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,8,balanced,0.06246933341026306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,8,balanced,0.0650079995393753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,16,power_law_1.2,0.8815936088562012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,8,power_law_1.01,0.032492798566818235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,8,balanced,0.025253333151340485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,16,power_law_1.2,0.9726400375366211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,8,balanced,0.06989333530267079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,8,balanced,0.06915733218193054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,8,power_law_1.01,0.040294399857521056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,8,power_law_1.01,0.035769599676132205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,8,balanced,0.026399999856948853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,16,power_law_1.2,1.4582655906677247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,8,power_law_1.01,0.04159359931945801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,8,balanced,0.0831520011027654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,8,balanced,0.02717866748571396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,8,power_law_1.01,0.031673601269721983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,8,balanced,0.08054399987061818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,16,power_law_1.2,2.41146240234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,8,power_law_1.01,0.04190720021724701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,8,power_law_1.01,0.03036159873008728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,8,balanced,0.029557332396507263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,8,power_law_1.01,0.04408319890499115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,16,power_law_1.2,4.973708724975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,8,balanced,0.10053333640098572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,8,balanced,0.03381866713364919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,8,power_law_1.01,0.03296000063419342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,8,balanced,0.09407466650009155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,8,power_law_1.01,0.043968001008033754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,8,power_law_1.01,0.0359935998916626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,8,balanced,0.03461333364248276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,8,power_law_1.01,0.04797439873218536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,8,balanced,0.0349440003434817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,8,power_law_1.01,0.0385343998670578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,8,balanced,0.11211733023325603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,8,power_law_1.01,0.04853120148181915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,8,balanced,0.099973330895106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,8,balanced,0.03488533447186152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,8,power_law_1.01,0.03873920142650604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,8,power_law_1.01,0.049446401000022885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,8,balanced,0.035573333501815796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,8,power_law_1.01,0.03916800022125244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,8,power_law_1.01,0.20265600681304932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,8,balanced,0.03653866549332937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,8,balanced,0.1571466624736786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,8,power_law_1.01,0.4323584079742432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,8,power_law_1.01,0.03986560106277466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,8,balanced,0.14403200149536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,8,balanced,0.0364533339937528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,8,power_law_1.01,0.43288960456848147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,8,power_law_1.01,0.04105600118637085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,8,power_law_1.01,0.06652799844741822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,8,balanced,0.03734933336575826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,8,power_law_1.01,0.04184960126876831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,8,power_law_1.01,0.07425280213356018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,8,power_law_1.01,0.045900800824165346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,8,balanced,0.03825599948565165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,8,balanced,0.1902773380279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,8,power_law_1.01,0.07712000012397766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,8,power_law_1.01,0.04888319969177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,8,balanced,0.039408000806967415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,8,balanced,0.16476266582806906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,8,power_law_1.01,0.08985599875450134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,8,power_law_1.01,0.04847359955310822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,8,power_law_1.01,0.10998400449752807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,8,power_law_1.01,0.05432320237159729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,8,power_law_1.01,0.05532159805297852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,8,power_law_1.01,0.1422271966934204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,8,power_law_1.01,0.05915520191192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,8,power_law_1.01,0.15219839811325073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,8,balanced,0.044735997915267944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,8,balanced,0.2749226689338684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,8,power_law_1.01,0.06959999799728393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,8,power_law_1.01,0.20035200119018554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,8,balanced,0.04562666515509287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,8,balanced,0.2338506579399109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,8,power_law_1.01,0.07635200023651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,8,power_law_1.01,0.22707200050354004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,8,power_law_1.01,0.08952320218086243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,8,power_law_1.01,0.34673919677734377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,8,power_law_1.01,0.10282880067825317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,8,power_law_1.01,0.39292159080505373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,8,power_law_1.01,0.13734400272369385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,8,power_law_1.01,0.5540224075317383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,8,power_law_1.01,0.14918400049209596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,8,balanced,0.052144000927607216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,8,power_law_1.01,0.8260928153991699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,8,power_law_1.01,0.19957760572433472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,8,balanced,0.3492106596628825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,8,balanced,0.0609386662642161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,8,balanced,0.2786666750907898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,8,power_law_1.01,0.28436479568481443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,8,power_law_1.01,1.7814592361450194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,8,balanced,0.06373333434263866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,8,power_law_1.01,0.41224961280822753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,8,power_law_1.01,0.5128320217132568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,8,power_law_1.01,0.6421247959136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,8,balanced,0.07904533545176189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,8,power_law_1.01,0.9359359741210938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,8,balanced,0.08797333637873332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,8,power_law_1.01,2.1004159927368162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,8,balanced,0.43640534083048504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,8,balanced,0.35339200496673584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,8,balanced,0.11901332934697469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,8,balanced,0.13662933309872946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,8,balanced,0.19751467307408652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,8,power_law_1.2,0.0274944007396698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,8,power_law_1.2,0.02632960081100464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,8,balanced,0.26843732595443726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,8,power_law_1.01,0.028384000062942505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,8,power_law_1.2,0.026867198944091796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,8,balanced,0.6785919666290283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,8,power_law_1.2,0.030700799822807313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,8,power_law_1.01,0.02627840042114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,8,balanced,0.52456001440684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,8,power_law_1.2,0.03246079981327057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,8,power_law_1.01,0.026649600267410277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,8,power_law_1.2,0.04023680090904236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,8,power_law_1.01,0.031488001346588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,8,power_law_1.2,0.041305598616600034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,8,power_law_1.01,0.03173120021820068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,8,balanced,0.3909440040588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,8,power_law_1.2,0.0441536009311676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,8,power_law_1.01,0.03432320058345795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,8,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,8,power_law_1.01,0.0349375993013382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,8,power_law_1.01,0.035897600650787356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,8,power_law_1.2,0.04601599872112274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,8,power_law_1.01,0.0381632000207901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,8,power_law_1.2,0.04978559911251068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,8,power_law_1.01,0.03903999924659729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,8,power_law_1.2,0.05095679759979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,8,power_law_1.01,0.04245760142803192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,8,power_law_1.2,0.04902400076389313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,8,power_law_1.01,0.04529919922351837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,8,power_law_1.2,0.430790376663208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,8,balanced,0.5040853420893351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,8,power_law_1.01,0.04733439981937408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,8,power_law_1.2,0.4337920188903809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,8,power_law_1.01,0.051712000370025636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,8,power_law_1.2,0.43301119804382326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,8,power_law_1.2,0.06999040246009827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,8,power_law_1.2,0.07663360238075256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,8,power_law_1.01,0.05572479963302612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,8,power_law_1.2,0.08611840009689331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,8,power_law_1.01,0.05934079885482788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,8,power_law_1.2,0.09411839842796325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,8,power_law_1.2,0.13089920282363893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,8,power_law_1.2,0.1553984045982361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,8,power_law_1.01,0.06506879925727845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,8,power_law_1.2,0.17260160446166992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,8,balanced,0.6275573174158732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,8,power_law_1.01,0.07252479791641235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,8,power_law_1.2,0.25128319263458254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,8,power_law_1.01,0.08730239868164062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,8,power_law_1.2,0.2882623910903931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,8,power_law_1.2,0.4438464164733887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,8,power_law_1.01,0.09777920246124268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,8,power_law_1.2,0.5600959777832031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,8,power_law_1.01,0.12774399518966675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,8,balanced,1.2912639776865642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,8,power_law_1.2,0.754099178314209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,8,power_law_1.01,0.1698367953300476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,8,balanced,0.9981493155161539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,8,power_law_1.2,1.1271743774414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,8,power_law_1.01,0.22987520694732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,8,power_law_1.01,0.29473280906677246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,8,power_law_1.2,3.297280120849609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,8,power_law_1.01,0.49414401054382323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,8,power_law_1.01,0.7068096160888672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,8,power_law_1.2,0.035795199871063235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,8,power_law_1.01,0.8134336471557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,8,power_law_1.2,0.030777600407600404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,8,balanced,0.9854880174001058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,8,power_law_1.2,0.03036159873008728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,8,power_law_1.01,1.1875455856323243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,8,power_law_1.2,0.03387520015239716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,8,power_law_1.2,0.03651840090751648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,8,power_law_1.01,1.7572032928466796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,8,power_law_1.2,0.038438400626182555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,8,power_law_1.2,0.037964800000190736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,8,power_law_1.2,0.03997440040111542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,8,power_law_1.01,3.2094593048095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,8,power_law_1.2,0.04037120044231415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,8,power_law_1.2,0.04113920032978058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,8,power_law_1.2,0.04474239945411682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,8,power_law_1.2,0.04901759922504425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,8,power_law_1.2,0.050470399856567386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,8,power_law_1.2,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,8,power_law_1.2,0.05630080103874206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,8,power_law_1.2,0.05868800282478333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,8,power_law_1.2,0.060844802856445314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,8,power_law_1.2,0.07128959894180298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,8,power_law_1.2,0.08347520232200623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,8,power_law_1.2,0.0920639991760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,8,power_law_1.2,0.11285760402679443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,8,power_law_1.2,0.14466559886932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,8,power_law_1.2,0.16915199756622315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,8,power_law_1.2,0.25528318881988527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,8,power_law_1.2,0.30202879905700686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,8,power_law_1.2,0.4996479988098145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,8,power_law_1.2,0.6658112049102783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,8,power_law_1.2,0.8180992126464843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,8,power_law_1.2,1.2411968231201171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,8,power_law_1.2,3.0483072280883787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,8,power_law_1.2,0.028787198662757873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,8,balanced,1.9277547200520833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,8,power_law_1.2,0.02656640112400055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,8,power_law_1.2,0.026995199918746948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,4,balanced,0.023183998962243397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,8,power_law_1.2,0.030399999022483824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,4,balanced,0.023381332556406658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,8,power_law_1.2,0.0318336009979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,4,balanced,0.025066666305065155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,8,power_law_1.2,0.03503359854221344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,4,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,8,power_law_1.2,0.035417601466178894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,4,balanced,0.04309333364168803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,8,power_law_1.2,0.037894400954246524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,4,balanced,0.04432533184687296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,4,balanced,0.0461760014295578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,8,power_law_1.2,0.03715839982032776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,4,balanced,0.04544533292452494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,8,power_law_1.2,0.04115839898586273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,4,balanced,0.045007998744646706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,8,power_law_1.2,0.04330880045890808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,4,balanced,0.04572799801826477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,8,power_law_1.2,0.04645760059356689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,4,balanced,0.04603200157483419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,8,power_law_1.2,0.04707199931144714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,4,balanced,0.04665599763393402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,8,power_law_1.2,0.05436800122261047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,4,balanced,0.04731733103593191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,4,balanced,0.048570667703946434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,8,power_law_1.2,0.06023039817810059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,4,balanced,0.053690666953722634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,8,power_law_1.2,0.05910400152206421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,4,balanced,0.0540533314148585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,4,balanced,0.05763733386993408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,8,power_law_1.2,0.06833919882774353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,4,balanced,0.06401599943637848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,8,power_law_1.2,0.07586560249328614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,4,balanced,0.07126399874687195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,8,power_law_1.2,0.09712640047073365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,4,balanced,0.09136533737182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,8,power_law_1.2,0.11109119653701782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,4,balanced,0.08933867017428081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,8,power_law_1.2,0.12803200483322144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,8,power_law_1.2,0.18643840551376342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,8,power_law_1.2,0.2541887998580933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,4,balanced,0.12748266259829202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,8,power_law_1.2,0.3720128059387207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,8,power_law_1.2,0.4907008171081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,8,power_law_1.2,0.7727104187011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,4,balanced,0.1304800013701121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,8,power_law_1.2,0.9602815628051757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,8,power_law_1.2,1.4079615592956543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,4,balanced,0.17732266585032144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,8,power_law_1.2,2.5044288635253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,8,power_law_1.2,4.269267272949219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,4,balanced,0.2271733283996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,4,balanced,0.33084267377853394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,4,balanced,0.03146133323510488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,4,balanced,0.031285333136717476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,4,balanced,0.03190933416287104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,4,power_law_1.01,0.025670400261878966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,4,balanced,0.035674666364987694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,4,balanced,0.04214400053024292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,4,power_law_1.01,0.025011199712753295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,4,balanced,0.041402667760849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,4,power_law_1.01,0.02656640112400055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,4,balanced,0.04227200150489807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,4,balanced,0.4255359967549642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,4,power_law_1.01,0.030368000268936157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,4,power_law_1.01,0.03364480137825012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,4,balanced,0.0425546665986379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,4,power_law_1.01,0.035148799419403076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,4,balanced,0.0414986660083135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,4,power_law_1.01,0.029996800422668456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,4,balanced,0.030042665700117748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,4,power_law_1.01,0.042054399847984314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,4,balanced,0.0425600012143453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,4,power_law_1.01,0.030611199140548707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,4,balanced,0.03141866624355316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,4,power_law_1.01,0.044710400700569156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,4,balanced,0.04283200204372406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,4,power_law_1.01,0.03375999927520752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,4,balanced,0.031925333042939506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,4,power_law_1.01,0.04549759924411774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,4,balanced,0.035002666215101876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,4,balanced,0.043162668744723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,4,power_law_1.01,0.036774399876594546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,4,power_law_1.01,0.04625279903411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,4,balanced,0.03957866628964742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,4,balanced,0.04533866544564565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,4,power_law_1.01,0.040454399585723874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,4,power_law_1.01,0.04733439981937408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,4,balanced,0.04084266722202301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,4,power_law_1.01,0.041465601325035094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,4,balanced,0.04598933458328247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,4,power_law_1.01,0.050988799333572386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,4,balanced,0.04146666576464971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,4,power_law_1.01,0.04200960099697113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,4,balanced,0.052202666799227394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,4,power_law_1.01,0.05343359708786011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,4,balanced,0.041834667325019836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,4,balanced,0.5336586634318033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,4,power_law_1.01,0.04172160029411316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,4,power_law_1.01,0.05379840135574341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,4,balanced,0.05273066461086273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,4,balanced,0.04228266576925913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,4,power_law_1.01,0.04255360066890716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,4,power_law_1.01,0.4327104091644287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,4,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,4,balanced,0.04349866509437561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,4,power_law_1.01,0.045286399126052854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,4,power_law_1.01,0.43534078598022463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,4,balanced,0.043280000487963356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,4,balanced,0.06670933465162913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,4,power_law_1.01,0.04885759949684143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,4,power_law_1.01,0.44039039611816405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,4,balanced,0.04568533102671305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,4,power_law_1.01,0.05129600167274475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,4,balanced,0.07286400099595387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,4,power_law_1.01,0.44037761688232424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,4,balanced,0.04765866696834564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,4,power_law_1.01,0.050271999835968015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,4,power_law_1.01,0.44464640617370604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,4,balanced,0.08392000198364258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,4,balanced,0.0491839994986852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,4,power_law_1.01,0.05824000239372253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,4,power_law_1.01,0.09128320217132568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,4,power_law_1.01,0.06218240261077881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,4,balanced,0.09702933828035991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,4,power_law_1.01,0.10615040063858032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,4,power_law_1.01,0.06721919775009155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,4,power_law_1.01,0.12042239904403687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,4,power_law_1.01,0.07957119941711426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,4,balanced,0.12930132945378622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,4,balanced,0.05754133562246958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,4,power_law_1.01,0.14755200147628783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,4,power_law_1.01,0.08370559811592101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,4,power_law_1.01,0.17633919715881347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,4,balanced,0.06022400160630544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,4,power_law_1.01,0.10673919916152955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,4,power_law_1.01,0.22961280345916749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,4,power_law_1.01,0.12056959867477417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,4,balanced,0.15026133259137472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,4,power_law_1.2,0.025228801369667053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,4,balanced,0.8224213123321533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,4,power_law_1.01,0.15418879985809325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,4,power_law_1.01,0.2763711929321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,4,power_law_1.2,0.024537600576877594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,4,power_law_1.01,0.18081920146942138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,4,power_law_1.01,0.4010623931884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,4,power_law_1.2,0.026316800713539125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,4,power_law_1.01,0.2565119981765747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,4,balanced,0.20900267362594604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,4,power_law_1.01,0.5945792198181152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,4,balanced,0.0670773337284724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,4,power_law_1.01,0.03081600069999695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,4,power_law_1.2,0.030355200171470642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,4,power_law_1.01,0.33244800567626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,4,power_law_1.01,0.653875207901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,4,power_law_1.01,0.03115519881248474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,4,balanced,0.08067200084527333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,4,power_law_1.2,0.033670398592948916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,4,power_law_1.01,0.5304959774017334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,4,power_law_1.01,0.031590399146080014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,4,power_law_1.01,1.000096035003662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,4,power_law_1.2,0.04306559860706329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,4,balanced,0.08455999692281087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,4,power_law_1.01,0.036032000184059144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,4,power_law_1.01,0.7290239810943604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,4,power_law_1.2,0.044352000951766966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,4,balanced,0.26523733139038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,4,power_law_1.01,0.03835520148277283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,4,power_law_1.01,2.263225555419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,4,power_law_1.2,0.045664000511169436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,4,power_law_1.01,0.8829376220703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,4,power_law_1.01,0.04166400134563446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,4,power_law_1.01,0.042483198642730716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,4,power_law_1.2,0.04642559885978699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,4,power_law_1.01,1.264633560180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,4,power_law_1.01,0.043968001008033754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,4,power_law_1.2,0.047251200675964354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,4,balanced,0.10962667067845662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,4,power_law_1.01,0.044377601146698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,4,power_law_1.01,0.04686720073223114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,4,power_law_1.01,2.604812812805176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,4,power_law_1.2,0.05149440169334411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,4,power_law_1.01,0.04924800097942352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,4,balanced,0.1236853301525116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,4,power_law_1.2,0.20583679676055908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,4,power_law_1.01,0.05435519814491272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,4,balanced,0.4044959942499797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,4,power_law_1.01,0.05464320182800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,4,power_law_1.2,0.3558464050292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,4,power_law_1.01,0.0636672019958496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,4,balanced,0.18172800540924072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,4,power_law_1.2,0.43415679931640627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,4,power_law_1.2,0.43674240112304685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,4,power_law_1.01,0.06960639953613282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,4,power_law_1.2,0.4381120204925537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,4,balanced,0.23656533161799112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,4,power_law_1.01,0.07393919825553893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,4,power_law_1.2,0.43912320137023925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,4,power_law_1.01,0.07828480005264282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,4,power_law_1.2,0.4476480007171631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,4,balanced,0.5330026547114054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,4,balanced,0.3394240140914917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,4,power_law_1.01,0.0932416021823883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,4,power_law_1.2,0.09122560024261475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,4,power_law_1.01,0.1067199945449829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,4,power_law_1.2,0.11884160041809082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,4,power_law_1.2,0.12602239847183228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,4,power_law_1.01,0.1324928045272827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,4,power_law_1.2,0.15311360359191895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,4,power_law_1.01,0.1713536024093628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,4,power_law_1.2,0.17583359479904176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,4,balanced,0.4364480177561442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,4,power_law_1.01,0.24566400051116943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,4,power_law_1.2,0.24389119148254396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,4,power_law_1.01,0.32836480140686036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,4,power_law_1.2,0.31623039245605467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,4,balanced,1.5645866394042969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,4,power_law_1.01,0.4447616100311279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,4,power_law_1.2,0.4993855953216553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,4,power_law_1.01,0.5192128181457519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,4,power_law_1.01,0.8264703750610352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,4,power_law_1.2,0.6552127838134766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,4,balanced,0.6690080165863037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,4,power_law_1.01,1.1211968421936036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,4,power_law_1.2,0.7635072231292724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,4,power_law_1.01,1.4027071952819825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,4,balanced,0.6404426495234171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,4,power_law_1.2,1.3480768203735352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,4,power_law_1.01,2.4935359954833984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,4,power_law_1.2,2.91473274230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,4,power_law_1.01,4.441388702392578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,4,power_law_1.2,0.03415040075778961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,4,power_law_1.2,0.029894399642944335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,4,power_law_1.2,0.03126400113105774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,4,balanced,0.8361226717631022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,4,power_law_1.2,0.03437440097332001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,4,power_law_1.2,0.03601920008659363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,4,power_law_1.2,0.04002560079097748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,4,power_law_1.2,0.04172160029411316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,4,balanced,1.0583840211232503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,4,power_law_1.2,0.04230400025844574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,4,power_law_1.2,0.042342400550842284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,4,power_law_1.2,0.04444800019264221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,4,power_law_1.2,0.04648320078849792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,4,power_law_1.2,0.050783997774124144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,4,balanced,1.0392959912618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,4,power_law_1.2,0.04981119930744171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,4,power_law_1.2,0.05178239941596985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,4,power_law_1.2,0.05973759889602661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,4,power_law_1.2,0.06367999911308289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,4,power_law_1.2,0.06944640278816223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,4,power_law_1.2,0.08145279884338379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,4,power_law_1.2,0.09258239865303039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,4,power_law_1.2,0.10926719903945922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,4,power_law_1.2,0.12558079957962037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,4,power_law_1.2,0.1767807960510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,4,power_law_1.2,0.1995200037956238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,4,power_law_1.2,0.30157439708709716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,4,power_law_1.2,0.40743041038513184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,4,power_law_1.2,0.6180031776428223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,4,power_law_1.2,0.7212736129760742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,4,balanced,1.648789405822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,4,power_law_1.2,0.9685824394226075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,4,power_law_1.2,1.8513343811035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,4,power_law_1.2,3.4445823669433593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,4,balanced,1.9917173385620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,4,balanced,3.2464160919189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,16,balanced,0.04052799940109253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,16,balanced,0.03818133225043615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,16,balanced,0.04915733138720194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,16,balanced,0.06482666730880737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,4,power_law_1.2,0.030976000428199767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,16,balanced,0.09840533137321472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,4,power_law_1.2,0.0318015992641449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,16,balanced,0.10071466366449992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,4,power_law_1.2,0.03192319869995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,16,balanced,0.10096533099810283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,4,power_law_1.2,0.03547520041465759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,16,balanced,0.10003200173377991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,16,balanced,0.10065600275993347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,4,power_law_1.2,0.03583360016345978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,16,balanced,0.10083199540774028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,4,power_law_1.2,0.04222719967365265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,16,balanced,0.10213866829872131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,4,power_law_1.2,0.042777600884437564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,16,balanced,0.10276266932487488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,4,power_law_1.2,0.0438400000333786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,16,balanced,0.1035040020942688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,4,power_law_1.2,0.04552960097789764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,16,balanced,0.03996799886226654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,16,balanced,0.10455999771753947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,4,power_law_1.2,0.046214398741722104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,16,balanced,0.03655466685692469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,16,balanced,0.11078400413195293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,4,power_law_1.2,0.05070719718933105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,16,balanced,0.037050666908423104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,16,balanced,0.11529599626859029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,4,power_law_1.2,0.053414398431777955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,16,balanced,0.05107733110586802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,16,balanced,0.11719999710718791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,4,power_law_1.2,0.057062399387359616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,16,balanced,0.07053333520889282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,4,power_law_1.2,0.06488959789276123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,16,balanced,0.12079999844233195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,16,balanced,0.0713866651058197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,16,balanced,0.12866666913032532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,16,balanced,0.07189333438873291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,16,power_law_1.01,0.09426559805870056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,4,power_law_1.2,0.07185919880867005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,16,balanced,0.07291733225186665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,16,balanced,0.13528000315030417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,4,power_law_1.2,0.07663360238075256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,16,power_law_1.01,0.06437119841575623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,16,balanced,0.0718560020128886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,16,power_law_1.01,0.051520001888275144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,16,balanced,0.15228799978892008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,16,balanced,0.07344000041484833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,16,power_law_1.01,0.06863359808921814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,16,balanced,0.07336000104745229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,4,power_law_1.2,0.08044800162315369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,16,power_law_1.01,0.0772607982158661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,16,balanced,0.07406933108965556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,16,balanced,0.18686934312184653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,4,power_law_1.2,0.09129599928855896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,16,power_law_1.01,0.0972544014453888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,16,balanced,0.07634666562080383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,4,power_law_1.2,0.10911999940872193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,16,power_law_1.01,0.09537280201911927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,16,balanced,0.07683733105659485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,16,balanced,0.02906133234500885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,16,balanced,0.19662932554880777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,16,power_law_1.01,0.09656320214271545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,16,balanced,0.081194669008255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,4,power_law_1.2,0.14376319646835328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,16,balanced,0.029306667546431225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,16,power_law_1.01,0.09729920029640197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,16,balanced,0.0821973333756129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,16,balanced,0.03200000027815501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,16,power_law_1.01,0.10487040281295776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,4,power_law_1.2,0.16332800388336183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,16,balanced,0.04635733366012573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,16,power_law_1.01,0.10769280195236205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,16,balanced,0.0858133335908254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,4,power_law_1.2,0.2965759992599487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,16,balanced,0.26555200417836505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,16,balanced,0.06502933303515117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,16,power_law_1.01,0.110099196434021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,4,power_law_1.2,0.32119040489196776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,16,balanced,0.09197866916656494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,16,balanced,0.06589866677920024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,16,power_law_1.01,0.12413439750671387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,4,power_law_1.2,0.558515214920044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,16,balanced,0.06588799754778545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,16,power_law_1.01,0.1205888032913208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,16,balanced,0.09869866569836934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,4,power_law_1.2,0.6200064182281494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,16,balanced,0.06648533542950948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,16,power_law_1.01,0.12976640462875366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,16,balanced,0.29154666264851886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,16,balanced,0.1086346705754598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,16,balanced,0.0673173318306605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,16,power_law_1.01,0.1364799976348877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,4,power_law_1.2,0.9592576026916504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,16,balanced,0.06898666421572368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,16,power_law_1.01,0.13646080493927001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,4,power_law_1.2,1.203872013092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,16,balanced,0.12379733721415202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,16,power_law_1.01,0.16542719602584838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,16,balanced,0.06890666484832764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,4,power_law_1.2,1.694246482849121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,16,power_law_1.01,0.1725119948387146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,16,balanced,0.06966933111349742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,16,balanced,0.15245866775512695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,16,power_law_1.01,0.19751039743423462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,16,balanced,0.07050133248170216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,4,power_law_1.2,2.565657615661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,16,balanced,0.4370719989140828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,16,power_law_1.01,0.2483839988708496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,16,balanced,0.07229333122571309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,16,power_law_1.01,0.3189183950424194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,4,power_law_1.2,5.890911865234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,16,balanced,0.17460266749064127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,16,power_law_1.01,0.4012288093566895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,16,power_law_1.01,0.49936637878417967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,16,balanced,0.07855466504891713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,16,power_law_1.01,0.6189248085021972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,16,balanced,0.2390186587969462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,16,balanced,0.07904533545176189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,16,power_law_1.01,0.9909695625305176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,16,balanced,0.5366133451461792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,16,power_law_1.01,1.1420351982116699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,16,power_law_1.01,0.07274879813194275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,16,power_law_1.01,1.2975168228149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,16,balanced,0.282970666885376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,16,power_law_1.01,0.05723519921302796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,16,power_law_1.01,2.193600082397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,16,power_law_1.01,0.046803200244903566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,16,power_law_1.01,0.05559679865837097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,16,power_law_1.01,4.439564895629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,16,power_law_1.01,0.05875840187072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,16,balanced,0.08366400003433228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,16,power_law_1.01,0.06796159744262695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,16,balanced,0.4147253433863322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,16,balanced,0.09201066692670186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,16,power_law_1.01,0.06946560144424438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,16,balanced,0.6866666475931803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,16,balanced,0.09521599610646565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,16,power_law_1.01,0.07038080096244811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,16,power_law_1.01,0.06425600051879883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,16,power_law_1.01,0.07027199864387512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,16,power_law_1.01,0.04222719967365265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,16,power_law_1.01,0.07431679964065552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,16,power_law_1.01,0.04071680009365082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,16,power_law_1.01,0.04893440008163452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,16,power_law_1.01,0.07719039916992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,16,balanced,0.11457066734631856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,16,power_law_1.01,0.056428802013397214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,16,power_law_1.01,0.08180480003356934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,16,power_law_1.01,0.06378239989280701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,16,balanced,0.5197173357009888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,16,power_law_1.01,0.06554880142211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,16,power_law_1.01,0.08373759984970093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,16,balanced,0.12463466326395671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,16,power_law_1.01,0.06695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,16,power_law_1.01,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,16,power_law_1.01,0.06759679913520814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,16,power_law_1.01,0.0930176019668579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,16,balanced,0.17056532700856528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,16,power_law_1.01,0.0713536024093628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,16,power_law_1.01,0.0958079993724823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,16,power_law_1.01,0.07735040187835693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,16,power_law_1.01,0.09818239808082581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,16,power_law_1.01,0.08036479949951172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,16,power_law_1.01,0.08558080196380616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,16,power_law_1.01,0.11546239852905274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,16,balanced,0.19313067197799683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,16,power_law_1.01,0.09482880234718323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,16,power_law_1.01,0.13886079788208008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,16,power_law_1.2,0.08967040181159973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,16,power_law_1.01,0.150271999835968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,16,power_law_1.2,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,16,balanced,1.0366986592610676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,16,power_law_1.01,0.10078719854354859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,16,power_law_1.01,0.19780479669570922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,16,power_law_1.2,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,16,power_law_1.01,0.10263680219650269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,16,balanced,0.6481226682662964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,16,power_law_1.01,0.2757951974868774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,16,power_law_1.2,0.06928640007972717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,16,power_law_1.2,0.07020800113677979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,16,power_law_1.01,0.28891520500183104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,16,balanced,0.28650667270024616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,16,power_law_1.01,0.10285439491271972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,16,power_law_1.2,0.09492480158805847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,16,power_law_1.01,0.1246783971786499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,16,power_law_1.01,0.3971967935562134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,16,power_law_1.01,0.15565439462661743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,16,power_law_1.2,0.0932416021823883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,16,power_law_1.01,0.48836479187011717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,16,power_law_1.2,0.10221439599990845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,16,power_law_1.01,0.17003519535064698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,16,power_law_1.01,0.7937088012695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,16,power_law_1.01,0.2155776023864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,16,balanced,0.3707146644592285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,16,power_law_1.2,0.10294400453567505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,16,power_law_1.01,0.9215423583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,16,power_law_1.01,0.33041279315948485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,16,power_law_1.2,0.10362880229949951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,16,power_law_1.01,0.4384255886077881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,16,power_law_1.01,1.2074048042297363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,16,power_law_1.2,0.10947200059890747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,16,power_law_1.01,0.5644544124603271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,16,power_law_1.2,0.11568000316619872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,16,power_law_1.01,1.8721920013427735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,16,power_law_1.01,0.7251711845397949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,16,power_law_1.2,0.13086719512939454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,16,power_law_1.01,1.159552001953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,16,power_law_1.2,0.12065919637680053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,16,power_law_1.01,4.399699020385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,16,balanced,0.5485973358154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,16,power_law_1.01,1.5506879806518554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,16,power_law_1.2,0.14223359823226928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,16,power_law_1.01,1.8727359771728516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,16,balanced,0.9840319951375326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,16,power_law_1.2,0.1434048056602478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,16,power_law_1.01,2.9259712219238283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,16,power_law_1.2,0.1495743989944458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,16,power_law_1.2,0.17112959623336793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,16,power_law_1.01,7.286342620849609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,16,power_law_1.2,0.18495999574661254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,16,power_law_1.2,0.22383360862731932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,16,balanced,0.7328000068664551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,16,power_law_1.2,0.2959743976593018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,16,power_law_1.2,0.38183040618896485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,16,power_law_1.2,0.48643198013305666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,16,power_law_1.2,0.6839871883392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,16,power_law_1.2,0.9674240112304687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,16,balanced,2.018042723337809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,16,power_law_1.2,1.1268416404724122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,16,power_law_1.2,1.694438362121582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,16,balanced,0.9155200322469076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,16,power_law_1.2,2.3269439697265626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,16,power_law_1.2,4.041203308105469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,16,power_law_1.2,9.38760986328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,16,balanced,1.922357400258382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,16,balanced,1.4436267217000325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,16,power_law_1.2,0.06897280216217042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,16,power_law_1.2,0.03919360041618347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,16,power_law_1.2,0.043270400166511534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,16,power_law_1.2,0.04880000054836273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,16,power_law_1.2,0.053401601314544675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,16,power_law_1.2,0.06885120272636414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,16,power_law_1.2,0.07084800004959106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,16,power_law_1.2,0.06965759992599488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,16,power_law_1.2,0.07286400198936463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,16,power_law_1.2,0.07191680073738098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,16,power_law_1.2,0.06405119895935059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,16,power_law_1.2,0.07954559922218322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,16,power_law_1.2,0.08387839794158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,16,power_law_1.2,0.041920000314712526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,16,power_law_1.2,0.08829439878463745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,16,power_law_1.2,0.03873279988765717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,16,power_law_1.2,0.08535040020942689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,16,power_law_1.2,0.04644480049610138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,16,power_law_1.2,0.09499520063400269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,16,power_law_1.2,0.056415998935699464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,16,balanced,2.829946517944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,16,power_law_1.2,0.0645632028579712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,16,power_law_1.2,0.10937600135803223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,16,power_law_1.2,0.06480000019073487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,16,power_law_1.2,0.10474239587783814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,16,power_law_1.2,0.12152320146560669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,16,power_law_1.2,0.06718080043792725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,16,power_law_1.2,0.13125760555267335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,16,power_law_1.2,0.07162240147590637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,16,power_law_1.2,0.16081279516220093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,16,power_law_1.2,0.07304959893226623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,16,power_law_1.2,0.20748798847198485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,16,power_law_1.2,0.07927039861679078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,16,power_law_1.2,0.29973759651184084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,16,power_law_1.2,0.081004798412323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,16,power_law_1.2,0.3311743974685669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,16,power_law_1.2,0.08999680280685425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,16,power_law_1.2,0.4564864158630371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,16,power_law_1.2,0.7192383766174316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,16,power_law_1.2,0.10415359735488891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,16,power_law_1.2,0.9682304382324218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,16,power_law_1.2,1.1805376052856444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,16,power_law_1.2,0.10310399532318115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,16,power_law_1.2,1.7167680740356446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,16,power_law_1.2,0.11080960035324097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,16,power_law_1.2,3.2913089752197267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,16,power_law_1.2,0.12090239524841309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,16,power_law_1.2,6.028409576416015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,16,power_law_1.2,0.14915839433670045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,8,balanced,0.037802666425704956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,16,power_law_1.2,0.18264960050582885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,8,balanced,0.037685332198937736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,8,balanced,0.045968001087506614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,16,power_law_1.2,0.2175679922103882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,8,balanced,0.061706667145093284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,16,power_law_1.2,0.27576959133148193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,8,balanced,0.1058079997698466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,16,power_law_1.2,0.4288640022277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,8,balanced,0.10169600447018941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,16,power_law_1.2,0.5649343967437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,8,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,8,balanced,0.10181867082913716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,8,balanced,0.10130666693051656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,8,balanced,0.033701332906881966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,8,balanced,0.037077332536379494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,16,power_law_1.2,0.8703104019165039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,8,balanced,0.10170666376749675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,8,balanced,0.10485866665840149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,8,balanced,0.05153599878152212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,16,power_law_1.2,1.2143360137939454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,8,balanced,0.07366399963696797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,8,balanced,0.10338667035102844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,16,power_law_1.2,1.8553407669067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,8,balanced,0.07183466851711273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,8,balanced,0.10406933228174846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,16,power_law_1.2,2.5046911239624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,8,balanced,0.07243200143178304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,8,balanced,0.10528533657391866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,8,balanced,0.07273066540559132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,16,power_law_1.2,2.9999935150146486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,8,balanced,0.10586667060852051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,8,balanced,0.07254933317502339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,8,balanced,0.11338667074839275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,16,power_law_1.2,4.883212661743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,8,balanced,0.07380266487598419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,8,balanced,0.1165013313293457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,8,balanced,0.07406400144100189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,8,balanced,0.11968533198038737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,16,power_law_1.2,11.662566375732421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,8,balanced,0.07497066756089528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,8,balanced,0.12589333454767862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,8,balanced,0.07688533266385396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,8,balanced,0.07815466821193695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,8,balanced,0.13322133819262186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,8,power_law_1.01,0.06322559714317322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,8,balanced,0.08368000388145447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,8,balanced,0.14467733105023703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,8,balanced,0.029322666426499683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,8,balanced,0.08412266770998637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,8,power_law_1.01,0.05555840134620667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,8,balanced,0.030991998811562855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,8,power_law_1.01,0.04714879989624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,8,balanced,0.15617600083351135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,8,balanced,0.09158933162689209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,8,balanced,0.03316266586383184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,8,power_law_1.01,0.05912320017814636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,8,balanced,0.09779199957847595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,8,balanced,0.04773333172003428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,8,power_law_1.01,0.07453439831733703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,8,balanced,0.20545067389806113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,8,balanced,0.10691199700037639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,8,balanced,0.0662720004717509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,8,power_law_1.01,0.092985600233078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,8,power_law_1.01,0.09401599764823913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,8,balanced,0.11768000324567159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,8,balanced,0.06706133484840393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,8,balanced,0.21967999140421549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,8,power_law_1.01,0.04752640128135681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,8,balanced,0.06777599950631459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,8,power_law_1.01,0.09761279821395874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,8,balanced,0.13150399923324585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,8,power_law_1.01,0.043756800889968875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,8,balanced,0.06879466772079468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,8,power_law_1.01,0.09861119985580444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,8,balanced,0.06900799771149953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,8,power_law_1.01,0.10388480424880982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,8,power_law_1.01,0.038176000118255615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,8,balanced,0.2999040087064107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,8,balanced,0.17669866482416788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,8,power_law_1.01,0.10543999671936036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,8,balanced,0.07025066514809926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,8,power_law_1.01,0.051795202493667605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,8,power_law_1.01,0.10702719688415527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,8,balanced,0.07076266904671986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,8,power_law_1.01,0.05482879877090454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,8,power_law_1.01,0.11218559741973877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,8,balanced,0.07227199772993724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,8,power_law_1.01,0.06843519806861878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,8,balanced,0.2062399983406067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,8,balanced,0.07493866483370464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,8,power_law_1.01,0.06961920261383056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,8,power_law_1.01,0.1155519962310791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,8,balanced,0.33747732639312744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,8,balanced,0.0765173335870107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,8,power_law_1.01,0.07060480117797852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,8,power_law_1.01,0.12331520318984986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,8,power_law_1.01,0.12691199779510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,8,power_law_1.01,0.07179520130157471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,8,balanced,0.2853386600812276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,8,power_law_1.01,0.13596160411834718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,8,power_law_1.01,0.07187839746475219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,8,power_law_1.01,0.15071359872817994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,8,power_law_1.01,0.07809919714927674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,8,balanced,0.08437866965929668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,8,power_law_1.01,0.17034879922866822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,8,power_law_1.01,0.08097919821739197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,8,balanced,0.5123200019200643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,8,balanced,0.0853760043780009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,8,power_law_1.01,0.08430079817771911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,8,power_law_1.01,0.20289919376373292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,8,balanced,0.3420693476994832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,8,power_law_1.01,0.08281599879264831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,8,power_law_1.01,0.2272576093673706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,8,power_law_1.01,0.09360640048980713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,8,power_law_1.01,0.3393728017807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,8,power_law_1.01,0.09637119770050048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,8,power_law_1.01,0.3203775882720947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,8,power_law_1.01,0.10005120038986207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,8,power_law_1.01,0.11223039627075196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,8,power_law_1.01,0.4994688034057617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,8,balanced,0.09326400359471639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,8,balanced,0.5110346476236979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,8,power_law_1.01,0.1408128023147583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,8,power_law_1.01,0.6064576148986817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,8,balanced,0.10637332995732625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,8,balanced,0.6419573227564493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,8,power_law_1.01,0.15667840242385864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,8,power_law_1.01,0.9056256294250489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,8,balanced,0.11174933115641277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,8,power_law_1.01,0.1902143955230713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,8,power_law_1.01,1.170406436920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,8,power_law_1.01,0.24492158889770507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,8,power_law_1.01,1.40830078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,8,power_law_1.01,0.31169919967651366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,8,power_law_1.01,2.0714496612548827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,8,power_law_1.01,0.4386688232421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,8,balanced,0.14098667105038962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,8,balanced,0.6490879853566488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,8,power_law_1.01,0.5087935924530029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,8,power_law_1.01,4.381996917724609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,8,balanced,0.156741331020991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,8,power_law_1.01,0.7712512016296387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,8,power_law_1.01,1.0115903854370116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,8,balanced,0.817349354426066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,8,balanced,0.23297067483266196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,8,power_law_1.01,1.1310079574584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,8,power_law_1.01,0.048556798696517946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,8,power_law_1.01,1.8946111679077149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,8,power_law_1.01,0.03983359932899475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,8,balanced,0.28734399875005084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,8,power_law_1.01,0.03708159923553467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,8,power_law_1.01,3.623014450073242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,8,power_law_1.01,0.046623998880386354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,8,power_law_1.01,0.05425919890403748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,8,balanced,0.8164693514506022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,8,power_law_1.01,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,8,power_law_1.01,0.06779519915580749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,8,power_law_1.01,0.06937599778175355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,8,power_law_1.01,0.0682752013206482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,8,power_law_1.01,0.07255039811134338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,8,balanced,0.41678400834401447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,8,power_law_1.01,0.07527679800987244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,8,power_law_1.01,0.0820032000541687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,8,power_law_1.01,0.09157760143280029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,8,power_law_1.01,0.09546239972114563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,8,power_law_1.2,0.06286079883575439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,8,balanced,0.5287040074666342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,8,balanced,1.2618559996287029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,8,power_law_1.2,0.04156799912452698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,8,power_law_1.01,0.1034432053565979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,8,power_law_1.2,0.04649600088596344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,8,power_law_1.2,0.05456640124320984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,8,power_law_1.01,0.11155840158462524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,8,power_law_1.2,0.07340160012245178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,8,power_law_1.2,0.0929535984992981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,8,power_law_1.2,0.09388160109519958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,8,power_law_1.01,0.10766079425811767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,8,balanced,1.2269813219706218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,8,balanced,0.7798026402791342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,8,power_law_1.2,0.0995519995689392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,8,power_law_1.2,0.09910399913787842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,8,power_law_1.01,0.13904000520706178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,8,power_law_1.2,0.10339839458465576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,8,power_law_1.01,0.15521279573440552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,8,power_law_1.2,0.10721280574798583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,8,power_law_1.2,0.10901119709014892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,8,power_law_1.01,0.21187200546264648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,8,power_law_1.2,0.11854720115661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,8,power_law_1.01,0.2614272117614746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,8,power_law_1.2,0.11660159826278686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,8,power_law_1.2,0.12723840475082399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,8,power_law_1.01,0.34088959693908694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,8,power_law_1.2,0.1374783992767334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,8,balanced,1.0323253472646077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,8,power_law_1.2,0.13994879722595216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,8,power_law_1.01,0.4495488166809082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,8,power_law_1.2,0.1674880027770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,8,power_law_1.2,0.18978559970855713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,8,power_law_1.01,0.7211904048919677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,8,power_law_1.2,0.21539840698242188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,8,power_law_1.01,0.7802815914154053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,8,power_law_1.2,0.2597055912017822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,8,power_law_1.2,0.306060791015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,8,power_law_1.01,1.223583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,8,power_law_1.2,0.3748543977737427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,8,power_law_1.01,1.9229503631591798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,8,power_law_1.2,0.5091072082519531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,8,power_law_1.01,2.0151424407958984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,8,power_law_1.2,0.6930624008178711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,8,power_law_1.01,3.7930431365966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,8,balanced,1.2865386803944905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,8,power_law_1.2,0.943667221069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,8,power_law_1.2,0.047705599665641786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,8,power_law_1.2,1.2974271774291992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,8,power_law_1.01,7.214323425292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,8,power_law_1.2,0.03528960049152374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,8,power_law_1.2,1.7085695266723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,8,power_law_1.2,0.038227200508117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,8,power_law_1.2,2.3434112548828123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,8,balanced,2.447813351949056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,8,power_law_1.2,0.04563199877738953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,8,power_law_1.2,0.057715201377868654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,8,power_law_1.2,7.857977294921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,8,power_law_1.2,0.06816639900207519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,8,power_law_1.2,0.06874880194664001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,8,balanced,2.383471965789795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,8,power_law_1.2,0.07118719816207886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,8,power_law_1.2,0.0722815990447998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,8,power_law_1.2,0.07181439995765686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,8,balanced,2.045269330342611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,8,power_law_1.2,0.07838720083236694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,8,power_law_1.2,0.08190720081329346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,8,power_law_1.2,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,8,power_law_1.2,0.08716800212860107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,8,power_law_1.2,0.09530240297317505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,8,power_law_1.2,0.09928320050239563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,8,power_law_1.2,0.10599679946899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,8,power_law_1.2,0.1221951961517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,8,power_law_1.2,0.13786239624023439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,8,power_law_1.2,0.16568959951400758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,8,power_law_1.2,0.20894079208374022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,8,power_law_1.2,0.30995199680328367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,8,power_law_1.2,0.3602816104888916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,8,power_law_1.2,0.45798401832580565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,8,power_law_1.2,0.580025577545166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,8,power_law_1.2,0.9044032096862793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,8,power_law_1.2,1.1910783767700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,8,power_law_1.2,1.7124095916748048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,8,power_law_1.2,2.169254493713379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,8,power_law_1.2,5.722227096557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,8,balanced,4.0096588134765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,8,power_law_1.2,0.04835839867591858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,8,power_law_1.2,0.03516800105571747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,8,power_law_1.2,0.037299200892448425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,4,balanced,0.03678400069475174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,8,power_law_1.2,0.04471679925918579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,4,balanced,0.037621334195137024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,8,power_law_1.2,0.049267199635505673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,4,balanced,0.046442667643229164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,8,power_law_1.2,0.06535680294036865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,4,balanced,0.06780266761779785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,8,power_law_1.2,0.06792960166931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,4,balanced,0.10030933221181233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,8,power_law_1.2,0.07078400254249573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,4,balanced,0.10259200135866801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,4,balanced,0.10332266489664714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,8,power_law_1.2,0.07255679965019227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,4,balanced,0.10384533802668254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,8,power_law_1.2,0.07431679964065552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,4,balanced,0.10426666339238484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,8,power_law_1.2,0.08184319734573364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,4,balanced,0.10450133681297302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,8,power_law_1.2,0.08632320165634155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,4,balanced,0.10529067118962605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,8,power_law_1.2,0.08873599767684937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,4,balanced,0.10677867134412129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,8,power_law_1.2,0.09649279713630676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,4,balanced,0.1086346705754598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,4,balanced,0.1102239986260732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,8,power_law_1.2,0.10306559801101685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,4,balanced,0.11762666702270508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,4,balanced,0.12179733316103618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,8,power_law_1.2,0.11296639442443848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,4,balanced,0.1274079978466034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,8,power_law_1.2,0.11881599426269532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,4,balanced,0.1378986636797587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,8,power_law_1.2,0.14137599468231202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,4,balanced,0.1481066644191742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,8,power_law_1.2,0.1721343994140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,4,balanced,0.16410133242607117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,8,power_law_1.2,0.2201024055480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,8,power_law_1.2,0.27217280864715576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,4,balanced,0.1770346760749817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,8,power_law_1.2,0.40619521141052245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,8,power_law_1.2,0.5632319927215577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,4,balanced,0.23586666584014893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,8,power_law_1.2,0.8704511642456054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,8,power_law_1.2,1.077824020385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,4,balanced,0.27195199330647785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,8,power_law_1.2,1.571571159362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,8,power_law_1.2,2.0755712509155275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,8,power_law_1.2,3.1618175506591797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,4,balanced,0.3791840076446533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,8,power_law_1.2,5.355436706542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,4,balanced,0.033146666983763375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,8,power_law_1.2,11.464192199707032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,4,balanced,0.03396799912055334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,4,balanced,0.4549119869867961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,4,balanced,0.037952000896135964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,4,balanced,0.05312533179918925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,4,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,4,balanced,0.07638933261235555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,4,power_law_1.01,0.036396801471710205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,4,power_law_1.01,0.03923200070858002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,4,balanced,0.07506666580835979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,4,power_law_1.01,0.04286080002784729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,4,power_law_1.01,0.03733760118484497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,4,balanced,0.07551999886830647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,4,power_law_1.01,0.059468799829483034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,4,balanced,0.6853280067443848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,4,power_law_1.01,0.03761920034885406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,4,power_law_1.01,0.06798080205917359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,4,balanced,0.07663999994595845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,4,power_law_1.01,0.09094399809837342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,4,power_law_1.01,0.050547200441360476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,4,balanced,0.07659199833869934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,4,power_law_1.01,0.09335039854049683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,4,power_law_1.01,0.05381119847297668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,4,power_law_1.01,0.0910975992679596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,4,balanced,0.07754666606585185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,4,power_law_1.01,0.09966719746589661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,4,power_law_1.01,0.07074559926986694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,4,balanced,0.0782773345708847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,4,power_law_1.01,0.10585600137710571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,4,balanced,0.034287999073664345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,4,power_law_1.01,0.07144320011138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,4,power_law_1.01,0.10490880012512208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,4,balanced,0.08108800152937572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,4,power_law_1.01,0.10837759971618652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,4,power_law_1.01,0.07260800004005433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,4,balanced,0.03536533315976461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,4,balanced,0.08181866506735484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,4,power_law_1.01,0.10891519784927368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,4,balanced,0.03864533454179764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,4,power_law_1.01,0.07346559762954712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,4,balanced,0.08400000135103862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,4,power_law_1.01,0.1192896008491516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,4,balanced,0.8608693281809489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,4,balanced,0.05209066470464071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,4,power_law_1.01,0.1256767988204956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,4,power_law_1.01,0.07546240091323853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,4,balanced,0.09070932865142822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,4,power_law_1.01,0.1303104043006897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,4,balanced,0.07191999753316243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,4,power_law_1.01,0.08341119885444641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,4,power_law_1.01,0.14967039823532105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,4,balanced,0.09303466478983562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,4,balanced,0.07392533123493195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,4,power_law_1.01,0.17485439777374268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,4,power_law_1.01,0.0824832022190094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,4,balanced,0.07558399935563405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,4,balanced,0.10032000144322713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,4,power_law_1.01,0.19797120094299317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,4,balanced,0.07585066556930542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,4,power_law_1.01,0.08633599877357483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,4,power_law_1.01,0.21578879356384278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,4,balanced,0.11180266737937927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,4,balanced,0.07686399916807811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,4,power_law_1.01,0.2663039922714233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,4,power_law_1.01,0.08996480107307434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,4,balanced,0.07834666470686595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,4,power_law_1.01,0.33159680366516114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,4,power_law_1.01,0.09809280037879944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,4,balanced,0.12139733632405598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,4,power_law_1.01,0.34552960395812987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,4,balanced,0.08036266764005025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,4,power_law_1.01,0.4797376155853271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,4,power_law_1.01,0.10359679460525513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,4,balanced,0.0825493335723877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,4,balanced,0.1395840048789978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,4,power_law_1.01,0.6668096065521241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,4,balanced,0.0855519970258077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,4,power_law_1.01,0.10718079805374145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,4,power_law_1.01,0.9009471893310547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,4,balanced,0.08878399928410848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,4,balanced,1.0961013634999592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,4,power_law_1.01,0.127347195148468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,4,balanced,0.15575466553370157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,4,power_law_1.01,1.164352035522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,4,power_law_1.01,0.14783999919891358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,4,power_law_1.01,1.4292223930358887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,4,power_law_1.01,0.17701120376586915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,4,balanced,0.21809599796930948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,4,power_law_1.01,2.1831296920776366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,4,power_law_1.01,0.1997696042060852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,4,balanced,0.10190932949384053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,4,power_law_1.01,4.335091018676758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,4,power_law_1.01,0.26484479904174807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,4,balanced,0.10372799634933472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,4,balanced,0.26197866598765057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,4,power_law_1.01,0.3279167890548706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,4,power_law_1.01,0.4430975914001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,4,power_law_1.01,0.5770112037658691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,4,balanced,0.3709706862767537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,4,power_law_1.01,0.8297727584838868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,4,power_law_1.01,1.050278377532959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,4,balanced,0.11926933129628499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,4,power_law_1.01,1.3845760345458984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,4,balanced,0.13995200395584106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,4,power_law_1.01,1.9652416229248046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,4,balanced,0.4569760163625081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,4,balanced,0.14756266276041666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,4,power_law_1.2,0.044972801208496095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,4,balanced,1.6439733505249023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,4,power_law_1.01,0.03969280123710632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,4,power_law_1.01,4.126649475097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,4,power_law_1.2,0.03816959857940674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,4,power_law_1.01,0.038431999087333676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,4,power_law_1.2,0.046348801255226134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,4,power_law_1.01,0.03971199989318848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,4,balanced,0.20033599932988486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,4,power_law_1.2,0.053964799642562865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,4,power_law_1.01,0.04874880015850067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,4,power_law_1.2,0.06647679805755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,4,balanced,0.6899840037027994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,4,power_law_1.01,0.05246719717979431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,4,balanced,0.24627200762430826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,4,power_law_1.2,0.09066879749298096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,4,power_law_1.01,0.0699455976486206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,4,power_law_1.2,0.09029120206832886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,4,power_law_1.01,0.07371519804000855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,4,balanced,0.3683040142059326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,4,power_law_1.2,0.09590399861335755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,4,power_law_1.01,0.07681279778480529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,4,power_law_1.2,0.10295679569244384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,4,power_law_1.01,0.07682560086250305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,4,balanced,0.4428639809290568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,4,power_law_1.2,0.10232319831848144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,4,power_law_1.01,0.0825984001159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,4,power_law_1.2,0.10666879415512084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,4,power_law_1.01,0.08780159950256347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,4,balanced,0.8898613452911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,4,power_law_1.2,0.11081600189208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,4,power_law_1.2,0.10904959440231324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,4,power_law_1.01,0.09374079704284669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,4,balanced,0.6430559953053793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,4,power_law_1.2,0.12183680534362792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,4,power_law_1.01,0.10027519464492798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,4,power_law_1.2,0.1251904010772705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,4,power_law_1.01,0.10895999670028686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,4,power_law_1.2,0.14011520147323608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,4,power_law_1.2,0.15688960552215575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,4,balanced,0.8311039606730143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,4,power_law_1.01,0.11902079582214356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,4,power_law_1.2,0.18398720026016235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,4,power_law_1.01,0.13244800567626952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,4,power_law_1.2,0.19896960258483887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,4,power_law_1.2,0.24554879665374757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,4,power_law_1.2,0.2750400066375732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,4,balanced,1.1100266774495442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,4,power_law_1.01,0.1335744023323059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,4,power_law_1.2,0.37816319465637205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,4,power_law_1.2,0.3891007900238037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,4,power_law_1.01,0.1682368040084839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,4,balanced,1.2334667046864827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,4,power_law_1.2,0.5359104156494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,4,power_law_1.01,0.19336960315704346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,4,power_law_1.2,0.670252799987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,4,balanced,3.211375872294108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,4,power_law_1.01,0.2668159961700439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,4,power_law_1.2,1.0819775581359863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,4,power_law_1.01,0.3445183992385864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,4,power_law_1.2,1.475558376312256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,4,power_law_1.01,0.4827583789825439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,4,power_law_1.2,1.799590492248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,4,power_law_1.01,0.5915647983551026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,4,power_law_1.2,2.858515167236328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,4,balanced,1.6303787231445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,4,power_law_1.01,0.9546175956726074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,4,power_law_1.2,6.409625244140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,4,power_law_1.01,1.1577664375305177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,4,power_law_1.01,1.494431972503662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,4,balanced,1.6901226043701172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,4,power_law_1.01,2.018367958068848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,4,power_law_1.01,2.817862319946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,4,power_law_1.01,4.742892837524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,4,balanced,2.024789333343506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,4,power_law_1.01,8.3611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,4,power_law_1.2,0.03646079897880554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,4,power_law_1.2,0.03460479974746704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,4,power_law_1.2,0.03857280015945434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,4,power_law_1.2,0.048172798752784726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,4,power_law_1.2,0.05121279954910278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,4,power_law_1.2,0.06958079934120179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,4,power_law_1.2,0.07189760208129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,4,power_law_1.2,0.07533439993858337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,4,power_law_1.2,0.0753600001335144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,4,power_law_1.2,0.07643520236015319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,4,power_law_1.2,0.07989760041236878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,4,balanced,3.2079200744628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,4,power_law_1.2,0.08409600257873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,4,power_law_1.2,0.09048320055007934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,4,power_law_1.2,0.09289600253105164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,4,power_law_1.2,0.10156799554824829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,4,power_law_1.2,0.10610560178756714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,4,power_law_1.2,0.12094080448150635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,4,power_law_1.2,0.13349759578704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,4,balanced,3.2741066614786782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,4,power_law_1.2,0.15288959741592406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,4,power_law_1.2,0.1782912015914917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,4,power_law_1.2,0.22148480415344238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,4,power_law_1.2,0.29616000652313235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,4,power_law_1.2,0.3354880094528198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,4,power_law_1.2,0.03964160084724426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,4,power_law_1.2,0.514470386505127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,4,power_law_1.2,0.03808639943599701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,4,power_law_1.2,0.6739456176757812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,4,power_law_1.2,0.04131200015544891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,4,power_law_1.2,0.876371192932129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,4,power_law_1.2,0.04854399859905243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,4,power_law_1.2,1.21146240234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,4,power_law_1.2,0.053273600339889524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,4,power_law_1.2,1.747091293334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,4,power_law_1.2,0.07177600264549255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,4,power_law_1.2,0.07341439723968506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,4,power_law_1.2,2.6450048446655274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,4,power_law_1.2,0.0766975998878479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,4,power_law_1.2,0.0793727993965149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,4,power_law_1.2,5.537843322753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,4,power_law_1.2,0.08332800269126892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,2,balanced,0.036874666810035706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,4,power_law_1.2,0.08979840278625488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,2,balanced,0.04050666590531667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,4,power_law_1.2,0.09880319833755494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,4,balanced,6.3354237874348955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,2,balanced,0.051072001457214355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,4,power_law_1.2,0.10090880393981934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,2,balanced,0.07054933408896129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,4,power_law_1.2,0.1109120011329651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,2,balanced,0.10714133580525716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,2,balanced,0.1095306674639384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,2,balanced,0.1129866639773051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,4,power_law_1.2,0.12017920017242431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,2,balanced,0.10973866780598958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,4,power_law_1.2,0.13074560165405275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,2,balanced,0.11085333426793416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,2,balanced,0.1113866666952769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,4,power_law_1.2,0.1432960033416748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,2,balanced,0.11218133568763733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,4,power_law_1.2,0.17687679529190065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,2,balanced,0.11477333307266235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,4,power_law_1.2,0.21092479228973388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,2,balanced,0.11667199929555257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,2,balanced,0.11941333611806233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,4,power_law_1.2,0.30008320808410643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,2,balanced,0.1283146639664968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,4,power_law_1.2,0.37046399116516116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,2,balanced,0.13525333007176718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,4,power_law_1.2,0.4906752109527588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,2,balanced,0.14455466469128928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,4,power_law_1.2,0.6160128116607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,2,balanced,0.16123732924461365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,4,power_law_1.2,0.9348992347717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,2,balanced,0.17429866393407187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,4,power_law_1.2,1.2649727821350099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,4,power_law_1.2,1.906867218017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,2,balanced,0.20002132654190063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,4,power_law_1.2,2.2471359252929686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,2,balanced,0.22218666474024454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,2,balanced,0.03505066782236099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,4,power_law_1.2,2.9306047439575194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,2,balanced,0.03686933219432831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,4,power_law_1.2,5.130464172363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,2,balanced,0.31204267342885333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,2,balanced,0.04238933324813843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,2,balanced,0.05884799857934316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,4,power_law_1.2,10.765599822998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,2,balanced,0.0855466624101003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,2,balanced,0.3656586805979411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,2,balanced,0.08719467123349507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,2,balanced,0.087909330924352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,2,balanced,0.08733866612116496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,2,balanced,0.5396106640497843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,2,balanced,0.08980799714724223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,2,balanced,0.0897866686185201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,2,balanced,0.09115200241406758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,2,balanced,0.09389866391817729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,2,balanced,0.6745599905649821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,2,balanced,0.04477333525816599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,2,balanced,0.09636267026265462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,2,balanced,0.04762133459250132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,2,power_law_1.01,0.04284160137176514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,2,balanced,0.10019733508427937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,2,balanced,0.05099200208981832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,2,power_law_1.01,0.040089601278305055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,2,balanced,0.10825066765149434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,2,balanced,0.06592000027497609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,2,power_law_1.01,0.04880639910697937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,2,balanced,0.1118239959081014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,2,balanced,0.09090133508046468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,2,balanced,1.0205972989400227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,2,power_law_1.01,0.06247040033340454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,2,balanced,0.1264533301194509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,2,balanced,0.09355200330416362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,2,power_law_1.01,0.06659200191497802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,2,balanced,0.09570667147636414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,2,balanced,0.1442506710688273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,2,power_law_1.01,0.09431040287017822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,2,balanced,0.09691733121871948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,2,balanced,0.1551413337389628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,2,power_law_1.01,0.09496319890022278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,2,balanced,0.09950400392214458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,2,power_law_1.01,0.10361599922180176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,2,balanced,0.1011199951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,2,balanced,0.18399999539057413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,2,balanced,0.10528000195821126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,2,power_law_1.01,0.10792319774627686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,2,balanced,0.11100266377131145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,2,power_law_1.01,0.1131327986717224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,2,balanced,0.21175465981165567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,2,balanced,1.320250670115153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,2,balanced,0.11635200182596843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,2,power_law_1.01,0.11913599967956542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,2,balanced,0.11949867010116577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,2,power_law_1.01,0.1276095986366272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,2,balanced,0.3055466612180074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,2,power_law_1.01,0.13229440450668334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,2,power_law_1.01,0.12737280130386353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,2,balanced,0.36318933963775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,2,power_law_1.01,0.14136960506439208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,2,balanced,0.14004266262054443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,2,power_law_1.01,0.1486847996711731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,2,power_law_1.01,0.15797120332717896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,2,balanced,0.1418719987074534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,2,power_law_1.01,0.20173439979553223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,2,balanced,0.5586453278859457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,2,balanced,1.6592213312784831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,2,power_law_1.01,0.03820799887180328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,2,power_law_1.01,0.22186241149902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,2,power_law_1.01,0.24925439357757567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,2,power_law_1.01,0.0365119993686676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,2,power_law_1.01,0.2902911901473999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,2,power_law_1.01,0.040428799390792844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,2,power_law_1.01,0.05187199711799621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,2,power_law_1.01,0.38075520992279055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,2,balanced,0.1710240046183268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,2,balanced,0.7291306654612223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,2,power_law_1.01,0.06021760106086731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,2,power_law_1.01,0.4716800212860107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,2,power_law_1.01,0.07699840068817139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,2,balanced,0.21084266901016235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,2,power_law_1.01,0.07825279831886292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,2,power_law_1.01,0.6283967971801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,2,power_law_1.01,0.08238720297813415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,2,balanced,0.24484266837437949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,2,power_law_1.01,0.825062370300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,2,power_law_1.01,0.08750720024108886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,2,power_law_1.01,0.08825600147247314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,2,power_law_1.01,1.1490752220153808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,2,power_law_1.01,0.09423999786376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,2,power_law_1.01,0.09927039742469787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,2,power_law_1.01,1.599782371520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,2,balanced,1.077776034673055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,2,power_law_1.01,0.10432640314102173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,2,balanced,0.3489439884821574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,2,power_law_1.01,1.8181312561035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,2,power_law_1.01,0.10877439975738526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,2,power_law_1.01,0.12135679721832275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,2,power_law_1.01,2.8337535858154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,2,balanced,0.41200534502665204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,2,power_law_1.01,0.12817280292510985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,2,power_law_1.01,0.1376255989074707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,2,balanced,2.4884586334228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,2,power_law_1.01,0.16785279512405396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,2,power_law_1.01,5.976326370239258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,2,balanced,0.62062935034434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,2,power_law_1.01,0.18398079872131348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,2,power_law_1.01,0.21831040382385253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,2,power_law_1.01,0.2652928113937378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,2,power_law_1.01,0.35801599025726316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,2,balanced,0.7597119808197021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,2,balanced,1.432538668314616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,2,power_law_1.01,0.4363711833953857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,2,power_law_1.01,0.6252096176147461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,2,power_law_1.01,0.8172032356262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,2,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,2,power_law_1.01,1.1176063537597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,2,balanced,1.10807466506958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,2,power_law_1.01,1.4756671905517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,2,power_law_1.01,0.04694400131702423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,2,power_law_1.01,1.9657983779907227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,2,power_law_1.01,0.05070080161094666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,2,power_law_1.01,0.058924800157546996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,2,power_law_1.01,2.9686336517333984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,2,power_law_1.01,0.06693120002746582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,2,balanced,1.4465279579162598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,2,power_law_1.2,0.03927040100097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,2,power_law_1.01,0.08777599930763244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,2,power_law_1.01,6.136851119995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,2,power_law_1.01,0.09233919978141784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,2,balanced,1.7718772888183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,2,power_law_1.2,0.03934719860553741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,2,power_law_1.01,0.09410560131072998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,2,power_law_1.2,0.0470335990190506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,2,power_law_1.01,0.09757440090179444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,2,power_law_1.2,0.056966400146484374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,2,power_law_1.01,0.10491520166397095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,2,power_law_1.2,0.06422399878501892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,2,power_law_1.01,0.11277439594268798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,2,power_law_1.2,0.09192320108413696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,2,balanced,2.1452266375223794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,2,power_law_1.01,0.12223360538482667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,2,power_law_1.2,0.09612799882888794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,2,power_law_1.01,0.12880640029907225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,2,power_law_1.2,0.10439039468765259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,2,power_law_1.01,0.14058239459991456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,2,power_law_1.2,0.10833920240402221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,2,power_law_1.2,0.11275520324707031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,2,power_law_1.2,0.12188800573348998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,2,power_law_1.01,0.1556671977043152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,2,power_law_1.01,0.1663424015045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,2,power_law_1.2,0.12559360265731812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,2,balanced,2.844245274861654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,2,balanced,4.864362716674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,2,power_law_1.2,0.13396480083465576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,2,power_law_1.01,0.18391040563583375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,2,power_law_1.2,0.13464319705963135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,2,balanced,2.6748374303181968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,2,power_law_1.01,0.23927040100097657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,2,power_law_1.2,0.14190720319747924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,2,power_law_1.2,0.1475711941719055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,2,power_law_1.01,0.2973504066467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,2,power_law_1.2,0.16353919506072997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,2,power_law_1.01,0.40018558502197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,2,power_law_1.2,0.2065471887588501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,2,power_law_1.2,0.038950398564338684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,2,power_law_1.01,0.4983039855957031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,2,power_law_1.2,0.22388479709625245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,2,power_law_1.2,0.035718399286270144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,2,power_law_1.01,0.7128575801849365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,2,balanced,3.5359252293904624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,2,power_law_1.2,0.25861759185791017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,2,power_law_1.2,0.04053759872913361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,2,power_law_1.01,0.8950079917907715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,2,power_law_1.2,0.29608960151672364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,2,power_law_1.2,0.04784640073776245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,2,power_law_1.01,1.2501503944396972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,2,power_law_1.2,0.398905611038208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,2,power_law_1.2,0.055667197704315184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,2,power_law_1.01,1.7800128936767579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,2,power_law_1.2,0.07697920203208923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,2,power_law_1.2,0.45969281196594236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,2,power_law_1.01,2.420128059387207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,2,power_law_1.2,0.08190079927444457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,2,power_law_1.2,0.6366079807281494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,2,power_law_1.01,3.12161922454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,2,power_law_1.2,0.08510720133781433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,2,power_law_1.2,0.8913536071777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,2,power_law_1.01,4.036563110351563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,2,power_law_1.2,0.0890175998210907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,2,power_law_1.2,1.230668830871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,2,power_law_1.2,0.08929280042648316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,2,power_law_1.01,6.425331115722656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,2,power_law_1.2,1.5640447616577149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,2,power_law_1.2,0.09388800263404846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,2,power_law_1.2,0.1031872034072876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,2,power_law_1.2,2.004416084289551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,2,power_law_1.01,13.08564453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,2,power_law_1.2,0.10641280412673951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,2,power_law_1.2,3.5076351165771484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,2,power_law_1.2,0.10980479717254639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,2,balanced,5.63046391805013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,2,power_law_1.2,0.11972479820251465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,2,power_law_1.2,7.900511932373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,2,power_law_1.2,0.12887680530548096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,2,power_law_1.2,0.14079359769821168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,2,power_law_1.2,0.17004159688949586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,2,power_law_1.2,0.1845695972442627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,2,balanced,5.233914693196614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,2,power_law_1.2,0.2323456048965454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,2,power_law_1.2,0.27733120918273924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,2,power_law_1.2,0.37868800163269045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,2,power_law_1.2,0.46636161804199217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,2,power_law_1.2,0.6622975826263428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,2,power_law_1.2,0.8656767845153809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,2,power_law_1.2,1.2563136100769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,2,power_law_1.2,1.5584832191467286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,2,power_law_1.2,2.0422079086303713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,2,power_law_1.2,3.068467140197754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,2,power_law_1.2,6.382028961181641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,2,balanced,11.113680521647135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,2,power_law_1.2,0.04412800073623657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,2,power_law_1.2,0.04769279956817627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,2,power_law_1.2,0.05107839703559876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,2,power_law_1.2,0.058208000659942624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,2,power_law_1.2,0.06673920154571533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,2,power_law_1.2,0.0884223997592926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,2,power_law_1.2,0.09482880234718323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,2,power_law_1.2,0.09586560130119323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,2,power_law_1.2,0.09907199740409851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,2,power_law_1.2,0.10646400451660157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,2,power_law_1.2,0.11802879571914673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,2,power_law_1.2,0.12283519506454468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,2,power_law_1.2,0.13008639812469483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,2,power_law_1.2,0.145305597782135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,2,power_law_1.2,0.15356800556182862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,1,balanced,0.045194665590922035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,2,power_law_1.2,0.17373440265655518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,1,balanced,0.04533333579699198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,1,balanced,0.05649599929650625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,2,power_law_1.2,0.18848639726638794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,1,balanced,0.08258666594823201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,2,power_law_1.2,0.23596160411834716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,1,balanced,0.1286079982916514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,2,power_law_1.2,0.2919680118560791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,1,balanced,0.03757333258787791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,1,balanced,0.1318186620871226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,2,power_law_1.2,0.4187327861785889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,1,balanced,0.13238400220870972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,1,balanced,0.04050133377313614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,2,power_law_1.2,0.5281280040740967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,1,balanced,0.13287466764450073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,1,balanced,0.04829333225886027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,2,power_law_1.2,0.7613632202148437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,1,balanced,0.07011733452479045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,1,balanced,0.13554666439692178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,2,power_law_1.2,0.9072383880615235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,1,balanced,0.1039680043856303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,1,balanced,0.13686933120091757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,2,power_law_1.2,1.351148796081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,1,balanced,0.10635200142860413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,2,power_law_1.2,1.7939584732055665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,1,balanced,0.13988799850145975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,1,balanced,0.10784000158309937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,2,power_law_1.2,2.8218368530273437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,1,balanced,0.1450506647427877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,1,balanced,0.1083733340104421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,2,power_law_1.2,3.6510848999023438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,1,balanced,0.11083199580510457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,1,balanced,0.14677332838376364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,1,balanced,0.1120853324731191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,2,power_law_1.2,4.51599349975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,1,balanced,0.15230400363604227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,1,balanced,0.11498133341471355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,2,power_law_1.2,6.725433349609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,1,balanced,0.11787733435630798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,1,balanced,0.15942399700482687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,1,balanced,0.12168533603350322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,1,balanced,0.16461333632469177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,1,balanced,0.13108799854914346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,2,power_law_1.2,14.624313354492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,1,balanced,0.18877333402633667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,1,balanced,0.14231999715169272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,1,balanced,0.1508693297704061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,1,balanced,0.21867199738820395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,1,balanced,0.17413866519927979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,1,balanced,0.24794133504231772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,1,balanced,0.1982240080833435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,1,balanced,0.2199359933535258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,1,balanced,0.28946133454640705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,1,balanced,0.2703626751899719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,1,balanced,0.3213760058085124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,1,balanced,0.3187040090560913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,1,balanced,0.5066560109456381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,1,balanced,0.482752005259196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,1,balanced,0.5859839916229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,1,balanced,0.5805600086847941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,1,balanced,0.9298880100250244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,1,balanced,0.9046506881713867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,1,power_law_1.01,0.03947519958019256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,1,power_law_1.01,0.035571199655532834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,1,power_law_1.01,0.04019840061664581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,1,power_law_1.01,0.04842239916324616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,1,power_law_1.01,0.03783040046691895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,1,power_law_1.01,0.06467840075492859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,1,power_law_1.01,0.0456063985824585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,1,balanced,1.2471360365549724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,1,balanced,1.2352320353190105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,1,power_law_1.01,0.0834176003932953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,1,power_law_1.01,0.05589759945869446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,1,power_law_1.01,0.11351679563522339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,1,power_law_1.01,0.06687359809875489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,1,power_law_1.01,0.11841280460357666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,1,power_law_1.01,0.09215999841690063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,1,power_law_1.01,0.12239999771118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,1,power_law_1.01,0.09801599979400635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,1,power_law_1.01,0.10124800205230713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,1,power_law_1.01,0.1300160050392151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,1,power_law_1.01,0.10695680379867553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,1,balanced,1.8785546620686848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,1,power_law_1.01,0.13219840526580812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,1,balanced,1.8847999572753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,1,power_law_1.01,0.11163519620895386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,1,power_law_1.01,0.14117759466171265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,1,power_law_1.01,0.1205888032913208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,1,power_law_1.01,0.162118399143219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,1,power_law_1.01,0.1288256049156189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,1,power_law_1.01,0.17878400087356566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,1,power_law_1.01,0.13740160465240478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,1,power_law_1.01,0.16846079826354982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,1,power_law_1.01,0.17844480276107788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,1,power_law_1.01,0.14171520471572877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,1,power_law_1.01,0.19360640048980712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,1,power_law_1.01,0.1544000029563904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,1,power_law_1.01,0.2120896100997925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,1,balanced,2.3897387186686196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,1,power_law_1.01,0.1652735948562622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,1,balanced,2.5014293988545737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,1,power_law_1.01,0.26216959953308105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,1,power_law_1.01,0.1835968017578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,1,power_law_1.01,0.3058687925338745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,1,power_law_1.01,0.21249279975891114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,1,power_law_1.01,0.34971520900726316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,1,power_law_1.01,0.2565824031829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,1,power_law_1.01,0.4341887950897217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,1,power_law_1.01,0.3143872022628784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,1,power_law_1.2,0.0383103996515274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,1,power_law_1.01,0.564185619354248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,1,power_law_1.01,0.3757055997848511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,1,power_law_1.01,0.6987904071807861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,1,power_law_1.2,0.04154239892959595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,1,power_law_1.01,0.5093503952026367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,1,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,1,power_law_1.01,0.9659968376159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,1,power_law_1.01,0.6452991962432861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,1,balanced,2.9663893381754556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,1,power_law_1.2,0.06051200032234192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,1,power_law_1.01,0.9145664215087891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,1,power_law_1.01,1.2591744422912599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,1,balanced,3.1378294626871743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,1,power_law_1.2,0.07953919768333435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,1,power_law_1.01,1.1923904418945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,1,power_law_1.01,1.8170560836791991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,1,power_law_1.2,0.11148799657821655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,1,power_law_1.01,1.7676416397094727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,1,power_law_1.01,2.390067291259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,1,power_law_1.2,0.12194559574127198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,1,power_law_1.01,2.3235647201538088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,1,power_law_1.2,0.12807680368423463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,1,power_law_1.01,3.002835273742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,1,power_law_1.2,0.13477120399475098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,1,power_law_1.01,2.871449661254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,1,power_law_1.01,4.665171051025391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,1,power_law_1.2,0.13640960454940795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,1,power_law_1.2,0.1445631980895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,1,power_law_1.01,4.691507339477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,1,power_law_1.2,0.1677183985710144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,1,power_law_1.01,9.987929534912109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,1,power_law_1.2,0.17790720462799073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,1,power_law_1.2,0.1693567991256714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,1,power_law_1.01,9.81377944946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,1,power_law_1.2,0.1806272029876709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,1,power_law_1.2,0.19289599657058715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,1,power_law_1.2,0.21430399417877197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,1,balanced,4.687146822611491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,1,power_law_1.2,0.2661695957183838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,1,power_law_1.2,0.3077183961868286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,1,balanced,4.775269190470378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,1,power_law_1.2,0.3694976091384888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,1,power_law_1.2,0.43811841011047364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,1,power_law_1.2,0.5666687965393067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,1,power_law_1.2,0.7030208110809326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,1,power_law_1.2,0.9765055656433106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,1,power_law_1.2,1.2732159614562988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,1,power_law_1.2,1.8415231704711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,1,power_law_1.2,2.411187171936035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,1,power_law_1.2,3.006835174560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,1,power_law_1.2,4.963552093505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,1,power_law_1.2,10.165042877197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,1,power_law_1.2,0.035699200630187986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,1,power_law_1.2,0.03792639970779419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,1,power_law_1.2,0.04325760006904602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,1,power_law_1.2,0.05438079833984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,1,power_law_1.2,0.06235520243644714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,1,power_law_1.2,0.09292160272598267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,1,balanced,9.729967753092447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,1,power_law_1.2,0.09806720018386841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,1,power_law_1.2,0.10240000486373901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,1,balanced,9.344682693481445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,1,power_law_1.2,0.10871039628982544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,1,power_law_1.2,0.11760640144348145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,1,power_law_1.2,0.12339839935302735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,1,power_law_1.2,0.13227519989013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,1,power_law_1.2,0.1384703993797302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,1,power_law_1.2,0.14388480186462402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,1,power_law_1.2,0.15675519704818724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,1,power_law_1.2,0.1694591999053955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,1,power_law_1.2,0.18712960481643676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,1,power_law_1.2,0.21822719573974608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,1,power_law_1.2,0.25985920429229736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,1,power_law_1.2,0.31943039894104003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,1,power_law_1.2,0.37846400737762453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,1,power_law_1.2,0.5141056060791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,1,power_law_1.2,0.6521408081054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,1,power_law_1.2,0.9194496154785157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,1,power_law_1.2,1.2076288223266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,1,power_law_1.2,1.8060287475585937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,1,power_law_1.2,2.3565952301025392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,1,power_law_1.2,2.9593151092529295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,1,power_law_1.2,4.835980987548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,1,power_law_1.2,9.884793853759765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,16,balanced,0.07733866572380066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,16,balanced,0.07120533287525177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,16,balanced,0.08634666601816814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,16,balanced,0.12828266620635986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,16,balanced,0.22986666361490884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,16,balanced,0.26126400629679364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,16,balanced,0.2662506699562073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,16,balanced,0.2625173330307007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,16,balanced,0.059664001067479454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,16,balanced,0.26393600304921466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,16,balanced,0.05880533158779144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,16,balanced,0.26314133405685425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,16,balanced,0.06429333488146464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,16,balanced,0.26582932472229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,16,balanced,0.09330133597056071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,16,balanced,0.2661760052045186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,16,balanced,0.1350826621055603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,16,balanced,0.26710933446884155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,16,balanced,0.15934933225313822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,16,balanced,0.27221866448720294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,16,balanced,0.16049066185951233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,16,balanced,0.16243199507395426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,16,balanced,0.27561599016189575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,16,balanced,0.1634986698627472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,16,balanced,0.050767997900644936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,16,balanced,0.2927359938621521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,16,balanced,0.16390400131543478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,16,balanced,0.04937600096066793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,16,balanced,0.2961759964625041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,16,balanced,0.16661333044370016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,16,balanced,0.1660160024960836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,16,balanced,0.06301866471767426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,16,balanced,0.31728533903757733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,16,balanced,0.16750933726628622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,16,balanced,0.09619733691215515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,16,balanced,0.3163253267606099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,16,balanced,0.17012800772984824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,16,balanced,0.13329066832860312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,16,balanced,0.1762239933013916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,16,balanced,0.1605280041694641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,16,balanced,0.39073065916697186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,16,balanced,0.1943626602490743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,16,balanced,0.16365866859753928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,16,balanced,0.18481600284576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,16,balanced,0.16222932934761047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,16,balanced,0.35444800059000653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,16,balanced,0.16350932916005453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,16,balanced,0.2225066622098287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,16,balanced,0.16542933384577432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,16,balanced,0.5532053311665853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,16,balanced,0.20719999074935913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,16,balanced,0.16870933771133423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,16,power_law_1.01,0.22236158847808837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,16,balanced,0.16740800937016806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,16,balanced,0.25633599360783893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,16,power_law_1.01,0.25601921081542967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,16,balanced,0.17045867443084717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,16,balanced,0.48476799329121906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,16,power_law_1.01,0.11215360164642334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,16,balanced,0.17309866348902384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,16,power_law_1.01,0.13672959804534912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,16,balanced,0.2550666729609172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,16,power_law_1.01,0.18744319677352905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,16,balanced,0.17825599511464438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,16,power_law_1.01,0.24466559886932374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,16,balanced,0.3744320074717204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,16,power_law_1.01,0.24484479427337646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,16,balanced,0.8972000281016032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,16,power_law_1.01,0.25081601142883303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,16,power_law_1.01,0.14693119525909423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,16,power_law_1.01,0.25039360523223875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,16,power_law_1.01,0.16192640066146852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,16,balanced,0.3656373421351115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,16,power_law_1.01,0.26384639739990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,16,balanced,0.1830986738204956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,16,power_law_1.01,0.07422720193862915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,16,power_law_1.01,0.27701759338378906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,16,balanced,0.86408003171285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,16,power_law_1.01,0.09505280256271362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,16,power_law_1.01,0.28115200996398926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,16,power_law_1.01,0.1117184042930603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,16,power_law_1.01,0.28654720783233645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,16,balanced,0.6157279809316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,16,power_law_1.01,0.14691840410232543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,16,power_law_1.01,0.28650879859924316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,16,power_law_1.01,0.13904000520706178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,16,power_law_1.01,0.3122431993484497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,16,balanced,0.19022399187088013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,16,power_law_1.01,0.15512319803237914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,16,power_law_1.01,0.34396800994873045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,16,power_law_1.01,0.15588480234146118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,16,power_law_1.01,0.35783679485321046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,16,balanced,1.488474686940511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,16,power_law_1.01,0.1609984040260315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,16,balanced,0.6388586759567261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,16,power_law_1.01,0.4011648178100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,16,power_law_1.01,0.41777920722961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,16,power_law_1.01,0.1711359977722168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,16,power_law_1.01,0.5622079849243165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,16,power_law_1.01,0.16862720251083374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,16,power_law_1.01,0.13605120182037353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,16,power_law_1.01,0.5201087951660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,16,power_law_1.01,0.17027839422225952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,16,power_law_1.01,0.6928575992584228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,16,power_law_1.01,0.19367680549621583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,16,power_law_1.01,0.15356800556182862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,16,balanced,0.20217067003250122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,16,power_law_1.01,0.9395392417907715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,16,power_law_1.01,0.21548159122467042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,16,power_law_1.01,0.0800704002380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,16,power_law_1.01,1.2545599937438965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,16,balanced,0.21527999639511108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,16,balanced,0.8432693481445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,16,power_law_1.01,0.22249600887298585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,16,power_law_1.01,0.0958400011062622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,16,power_law_1.01,1.6315391540527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,16,balanced,1.4250987370808919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,16,power_law_1.01,0.21950719356536866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,16,power_law_1.01,0.1167680025100708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,16,power_law_1.01,2.180384063720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,16,power_law_1.01,0.28051199913024905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,16,power_law_1.01,0.15024640560150146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,16,power_law_1.01,2.5234048843383787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,16,power_law_1.01,0.2760576009750366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,16,power_law_1.01,0.14557440280914308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,16,power_law_1.01,3.103603172302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,16,power_law_1.01,0.33792641162872317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,16,power_law_1.01,0.14814720153808594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,16,power_law_1.01,0.35489280223846437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,16,power_law_1.01,4.854969787597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,16,power_law_1.01,0.15299199819564818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,16,power_law_1.01,0.45238399505615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,16,balanced,0.24581333001454672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,16,power_law_1.01,0.15953279733657838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,16,balanced,1.0860106945037842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,16,power_law_1.01,10.778182220458984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,16,power_law_1.01,0.6322112083435059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,16,power_law_1.01,0.16486400365829468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,16,balanced,0.2672800024350484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,16,power_law_1.01,0.8770943641662597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,16,power_law_1.01,0.18568960428237916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,16,balanced,1.696623961130778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,16,power_law_1.01,1.0715392112731934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,16,power_law_1.01,0.1974720001220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,16,power_law_1.01,0.22147200107574463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,16,power_law_1.01,1.5477567672729493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,16,power_law_1.01,0.22892799377441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,16,power_law_1.01,1.6801792144775392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,16,balanced,0.3807733456293742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,16,power_law_1.01,2.2468288421630858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,16,power_law_1.2,0.2278592109680176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,16,power_law_1.01,0.22055680751800538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,16,balanced,0.43516798814137775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,16,power_law_1.01,3.5868030548095704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,16,power_law_1.2,0.11434880495071412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,16,balanced,1.295898675918579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,16,power_law_1.2,0.11594879627227783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,16,power_law_1.01,0.24516479969024657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,16,power_law_1.01,7.181446075439453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,16,power_law_1.2,0.13668479919433593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,16,power_law_1.2,0.16253440380096434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,16,power_law_1.2,0.23160960674285888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,16,power_law_1.01,0.2733439922332764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,16,balanced,0.628378669420878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,16,power_law_1.2,0.2499135971069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,16,power_law_1.01,0.3230783939361572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,16,power_law_1.2,0.2534976005554199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,16,balanced,2.6392480532328286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,16,power_law_1.2,0.25588479042053225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,16,power_law_1.01,0.3892287969589233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,16,power_law_1.2,0.24410879611968994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,16,power_law_1.01,0.49183359146118166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,16,balanced,0.8429013093312582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,16,power_law_1.2,0.2872767925262451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,16,power_law_1.2,0.3021888017654419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,16,power_law_1.01,0.5852543830871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,16,power_law_1.2,0.14358400106430053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,16,power_law_1.2,0.2913727998733521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,16,power_law_1.01,0.7967360019683838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,16,power_law_1.2,0.08580480217933655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,16,power_law_1.2,0.3189568042755127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,16,balanced,2.00983460744222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,16,power_law_1.2,0.07292159795761108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,16,power_law_1.2,0.32108800411224364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,16,power_law_1.2,0.09463040232658386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,16,power_law_1.01,1.1763903617858886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,16,power_law_1.2,0.34800000190734864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,16,power_law_1.2,0.11079039573669433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,16,balanced,1.1523626645406086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,16,power_law_1.2,0.1468287944793701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,16,power_law_1.01,1.6372735977172852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,16,power_law_1.2,0.36726400852203367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,16,power_law_1.2,0.1452288031578064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,16,power_law_1.2,0.46555519104003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,16,power_law_1.2,0.15324800014495848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,16,power_law_1.01,2.210771179199219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,16,power_law_1.2,0.4945216178894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,16,power_law_1.2,0.15278719663619994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,16,power_law_1.2,0.664518404006958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,16,power_law_1.2,0.16569600105285645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,16,power_law_1.01,2.945318412780762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,16,power_law_1.2,0.16255999803543092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,16,power_law_1.2,0.6224319934844971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,16,power_law_1.2,0.17290879487991334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,16,power_law_1.01,3.7906112670898438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,16,power_law_1.2,0.18202879428863525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,16,power_law_1.2,0.7054143905639648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,16,power_law_1.2,0.21161599159240724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,16,power_law_1.2,1.1494527816772462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,16,balanced,1.5217599868774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,16,power_law_1.01,6.616915130615235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,16,power_law_1.2,0.23170559406280516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,16,power_law_1.2,0.25382399559020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,16,power_law_1.2,1.5470335960388184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,16,power_law_1.2,0.24571518898010253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,16,power_law_1.2,0.29923200607299805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,16,power_law_1.01,12.4417724609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,16,power_law_1.2,2.2388288497924806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,16,power_law_1.2,0.31712000370025634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,16,power_law_1.2,0.41127681732177734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,16,power_law_1.2,3.0893695831298826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,16,power_law_1.2,0.44312319755554197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,16,power_law_1.2,2.9968576431274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,16,power_law_1.2,0.5751359939575196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,16,power_law_1.2,0.7390463829040528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,16,power_law_1.2,5.081919860839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,16,power_law_1.2,1.0261823654174804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,16,power_law_1.2,1.4294400215148926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,16,power_law_1.2,8.72194595336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,16,balanced,1.827397346496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,16,power_law_1.2,1.8473791122436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,16,balanced,5.343727747599284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,16,power_law_1.2,2.569196891784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,16,power_law_1.2,3.5760833740234377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,16,power_law_1.2,19.153701782226562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,16,power_law_1.2,6.3162494659423825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,16,power_law_1.2,10.869574737548827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,16,balanced,3.974266688028971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,16,balanced,2.915797233581543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,16,power_law_1.2,0.1378432035446167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,16,power_law_1.2,0.08373119831085205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,16,balanced,5.772373199462891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,16,power_law_1.2,0.07735040187835693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,16,power_law_1.2,0.09288319945335388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,16,power_law_1.2,0.10338560342788697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,16,power_law_1.2,0.14058239459991456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,16,power_law_1.2,0.1407487988471985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,16,power_law_1.2,0.15345280170440673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,8,balanced,0.06000000238418579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,16,power_law_1.2,0.15697920322418213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,8,balanced,0.06311466793219249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,16,power_law_1.2,0.16615040302276612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,8,balanced,0.08585600058237712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,16,power_law_1.2,0.18472959995269775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,8,balanced,0.1284213364124298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,16,power_law_1.2,0.18317439556121826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,8,balanced,0.2336533268292745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,16,power_law_1.2,0.20293760299682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,8,balanced,0.2815306584040324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,8,balanced,0.27778132756551105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,16,power_law_1.2,0.22181119918823242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,8,balanced,0.2637866735458374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,16,power_law_1.2,0.2524991989135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,8,balanced,0.26494399706522626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,8,balanced,0.2658933401107788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,8,balanced,0.26739199956258136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,16,power_law_1.2,0.24942080974578856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,8,balanced,0.2692799965540568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,8,balanced,0.27086400985717773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,8,balanced,0.2723520000775655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,16,power_law_1.2,0.27063679695129395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,8,balanced,0.27934932708740234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,8,balanced,0.30088533957799274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,16,power_law_1.2,0.30788478851318357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,8,balanced,0.3001120090484619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,16,power_law_1.2,0.3373183965682983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,8,balanced,0.3277119994163513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,8,balanced,0.3230560024579366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,16,power_law_1.2,0.41510400772094724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,8,balanced,0.3969279925028483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,16,power_law_1.2,0.5781311988830566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,8,balanced,0.36963733037312824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,8,balanced,0.049029335379600525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,16,power_law_1.2,0.7212607860565186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,8,balanced,0.05217066903909048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,16,power_law_1.2,0.9360511779785157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,8,balanced,0.5648106733957926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,8,balanced,0.06483200192451477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,8,balanced,0.09513599673906963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,8,balanced,0.13503999511400858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,16,power_law_1.2,1.442144012451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,8,balanced,0.5036906798680624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,8,balanced,0.16116799910863241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,16,power_law_1.2,2.2119232177734376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,8,balanced,0.16309332847595215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,8,balanced,0.16405866543451944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,16,power_law_1.2,3.346873474121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,8,balanced,0.16683733463287354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,8,balanced,0.8981813589731852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,8,balanced,0.16658133268356323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,16,power_law_1.2,4.338860702514649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,8,balanced,0.16874667008717856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,16,power_law_1.2,4.932729721069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,8,balanced,0.16962667306264242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,8,balanced,0.1717546582221985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,8,balanced,0.8823413054148356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,16,power_law_1.2,9.714713287353515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,8,balanced,0.17467200756072998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,8,power_law_1.01,0.08940160274505615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,8,power_law_1.01,0.15066239833831788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,8,balanced,0.18057066202163696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,8,power_law_1.01,0.09557759761810303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,8,power_law_1.01,0.15819519758224487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,8,balanced,0.20837867259979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,8,power_law_1.01,0.06467840075492859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,16,power_law_1.2,22.9753662109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,8,power_law_1.01,0.08701440095901489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,8,power_law_1.01,0.08633599877357483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,8,balanced,0.19037866592407227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,8,power_law_1.01,0.10203520059585572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,8,power_law_1.01,0.11736960411071777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,8,power_law_1.01,0.14216959476470947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,8,balanced,0.2191093365351359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,8,balanced,1.1403413613637288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,8,power_law_1.01,0.1383039951324463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,8,power_law_1.01,0.1706496000289917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,8,balanced,0.21963733434677124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,8,power_law_1.01,0.14856319427490233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,8,balanced,0.04506133496761322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,8,power_law_1.01,0.09587839841842652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,8,power_law_1.01,0.22120959758758546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,8,power_law_1.01,0.15397119522094727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,8,balanced,0.05041599770387014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,8,power_law_1.01,0.15274879932403565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,8,power_law_1.01,0.22933759689331054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,8,power_law_1.01,0.11463680267333984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,8,balanced,0.28287466367085773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,8,power_law_1.01,0.15508480072021485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,8,balanced,0.06300266583760579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,8,power_law_1.01,0.06570240259170532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,8,power_law_1.01,0.2517184019088745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,8,power_law_1.01,0.16560640335083007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,8,balanced,0.2773600021998088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,8,balanced,0.09669333696365356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,8,power_law_1.01,0.17250560522079467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,8,power_law_1.01,0.09128320217132568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,8,power_law_1.01,0.2473599910736084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,8,power_law_1.01,0.19466880559921265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,8,balanced,0.13922666509946188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,8,power_law_1.01,0.10815999507904053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,8,power_law_1.01,0.24960000514984132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,8,power_law_1.01,0.20845439434051513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,8,balanced,1.4758559862772624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,8,balanced,0.16340800126393637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,8,balanced,0.3935733238855998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,8,power_law_1.01,0.23002879619598388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,8,power_law_1.01,0.1351423978805542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,8,power_law_1.01,0.2590784072875977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,8,power_law_1.01,0.21425919532775878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,8,balanced,0.16485866904258728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,8,power_law_1.01,0.14398720264434814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,8,power_law_1.01,0.27070720195770265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,8,power_law_1.01,0.25423359870910645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,8,balanced,0.16770132382710776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,8,power_law_1.01,0.15072640180587768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,8,balanced,0.40620799859364826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,8,power_law_1.01,0.2686912059783936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,8,balanced,0.16785067319869995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,8,power_law_1.01,0.291212797164917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,8,power_law_1.01,0.3299263954162598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,8,power_law_1.01,0.1555199980735779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,8,balanced,0.16917866468429565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,8,power_law_1.01,0.28855679035186765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,8,power_law_1.01,0.35520000457763673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,8,power_law_1.01,0.15822720527648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,8,balanced,0.17057599623998007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,8,power_law_1.01,0.43614721298217773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,8,power_law_1.01,0.3324991941452026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,8,power_law_1.01,0.17204480171203612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,8,power_law_1.01,0.5901375770568847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,8,balanced,0.6568160057067871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,8,balanced,0.17334934075673422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,8,power_law_1.01,0.3414207935333252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,8,power_law_1.01,0.8441984176635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,8,power_law_1.01,0.17934080362319946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,8,balanced,0.17670400937398276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,8,power_law_1.01,0.32767999172210693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,8,power_law_1.01,0.9450431823730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,8,power_law_1.01,0.1950144052505493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,8,balanced,0.18012799819310507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,8,balanced,1.7441493670145671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,8,power_law_1.01,1.2718655586242675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,8,power_law_1.01,0.4154816150665283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,8,power_law_1.01,0.2071552038192749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,8,balanced,0.18610133727391562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,8,power_law_1.01,1.8324031829833984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,8,power_law_1.01,0.42934398651123046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,8,power_law_1.01,0.23545598983764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,8,balanced,0.7214879989624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,8,power_law_1.01,2.0221183776855467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,8,power_law_1.01,0.48097920417785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,8,power_law_1.01,3.290457534790039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,8,power_law_1.01,0.5233151912689209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,8,power_law_1.01,0.5787903785705566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,8,power_law_1.01,6.835968017578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,8,balanced,0.1920213301976522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,8,power_law_1.01,0.217958402633667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,8,power_law_1.01,0.8560959815979003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,8,power_law_1.01,1.0956992149353026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,8,power_law_1.01,1.3233792304992675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,8,balanced,0.9456373055775961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,8,power_law_1.01,1.8695360183715821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,8,balanced,0.20510933796564737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,8,power_law_1.01,0.24067840576171876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,8,power_law_1.01,2.5530176162719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,8,power_law_1.01,3.142291259765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,8,balanced,2.724186579386393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,8,power_law_1.01,4.384499359130859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,8,power_law_1.01,9.577996826171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,8,balanced,1.240613301595052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,8,balanced,0.22207999229431152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,8,power_law_1.01,0.28127360343933105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,8,power_law_1.2,0.15004160404205322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,8,balanced,0.23778667052586874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,8,power_law_1.01,0.33524479866027834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,8,power_law_1.2,0.07490559816360473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,8,power_law_1.2,0.11011199951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,8,power_law_1.2,0.11137919425964356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,8,power_law_1.2,0.1388543963432312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,8,power_law_1.2,0.2296447992324829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,8,balanced,1.4864373207092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,8,power_law_1.01,0.38706560134887696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,8,power_law_1.2,0.231276798248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,8,balanced,0.2835413416226705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,8,power_law_1.2,0.2442239999771118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,8,power_law_1.01,0.5238912105560303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,8,balanced,0.3263946572939555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,8,power_law_1.2,0.25498878955841064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,8,power_law_1.2,0.257260799407959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,8,power_law_1.2,0.2628607988357544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,8,power_law_1.2,0.2854720115661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,8,power_law_1.01,0.6582335948944091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,8,balanced,0.4762880007425944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,8,power_law_1.2,0.2881407976150513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,8,power_law_1.01,0.7968768119812012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,8,power_law_1.2,0.32627201080322266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,8,power_law_1.2,0.34456961154937743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,8,balanced,0.552021344502767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,8,power_law_1.2,0.37411839962005616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,8,power_law_1.01,1.1743040084838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,8,power_law_1.2,0.36231679916381837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,8,power_law_1.01,1.5561471939086915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,8,power_law_1.2,0.40968961715698243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,8,balanced,2.3045600255330405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,8,balanced,5.348213195800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,8,balanced,0.7907733122507731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,8,power_law_1.2,0.4448703765869141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,8,power_law_1.01,2.2180095672607423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,8,power_law_1.2,0.5486207962036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,8,power_law_1.01,3.301708984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,8,power_law_1.2,0.532102394104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,8,power_law_1.01,3.870809555053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,8,power_law_1.2,0.6826879978179932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,8,balanced,1.053978681564331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,8,power_law_1.2,0.9854335784912109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,8,power_law_1.01,5.369996643066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,8,power_law_1.2,1.3423935890197753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,8,power_law_1.01,11.816544342041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,8,power_law_1.2,1.6555776596069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,8,balanced,1.464421272277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,8,power_law_1.2,2.2296192169189455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,8,power_law_1.2,3.418201446533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,8,power_law_1.2,3.4156864166259764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,8,power_law_1.2,6.792147064208985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,8,balanced,1.933509349822998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,8,power_law_1.2,12.065740966796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,8,power_law_1.2,0.0945855975151062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,8,balanced,2.340218702952067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,8,balanced,4.530538558959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,8,power_law_1.2,0.0680191993713379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,8,power_law_1.2,0.06914560198783874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,8,power_law_1.2,0.07735679745674133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,8,power_law_1.2,0.10443520545959473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,8,power_law_1.2,0.1414463996887207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,8,power_law_1.2,0.1484544038772583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,8,power_law_1.2,0.1449087977409363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,8,power_law_1.2,0.1562432050704956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,8,power_law_1.2,0.15211520195007325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,8,power_law_1.2,0.16254719495773315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,8,power_law_1.2,0.17147519588470458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,8,power_law_1.2,0.1699072003364563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,8,balanced,3.7242507934570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,8,power_law_1.2,0.20236799716949463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,8,power_law_1.2,0.22076799869537353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,8,power_law_1.2,0.22595200538635254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,8,power_law_1.2,0.0963648021221161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,8,power_law_1.2,0.23228800296783447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,8,power_law_1.2,0.06684799790382386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,8,power_law_1.2,0.25505919456481935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,8,power_law_1.2,0.06247680187225342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,8,power_law_1.2,0.2835007905960083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,8,power_law_1.2,0.36550400257110593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,8,power_law_1.2,0.09500160217285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,8,power_law_1.2,0.3967103958129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,8,power_law_1.2,0.09264640212059021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,8,power_law_1.2,0.14324480295181274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,8,power_law_1.2,0.5025087833404541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,8,power_law_1.2,0.1473471999168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,8,power_law_1.2,0.6753664016723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,8,power_law_1.2,0.9072959899902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,8,power_law_1.2,0.14420479536056519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,8,power_law_1.2,0.1622207999229431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,8,power_law_1.2,1.038809585571289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,8,power_law_1.2,0.1644927978515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,8,power_law_1.2,1.6369855880737305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,4,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,8,power_law_1.2,0.17149440050125123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,4,balanced,0.06320000191529591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,8,power_law_1.2,2.3864831924438477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,8,power_law_1.2,0.18844159841537475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,4,balanced,0.08546132842699687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,4,balanced,0.12777599692344666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,8,power_law_1.2,0.20045440196990966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,8,power_law_1.2,2.4701887130737306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,4,balanced,0.23566399017969766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,8,power_law_1.2,0.22047359943389894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,4,balanced,0.2725920081138611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,8,power_law_1.2,4.060262298583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,4,balanced,0.2747360070546468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,8,power_law_1.2,0.24101760387420654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,4,balanced,0.26529600222905475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,4,balanced,0.26678399244944256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,8,power_law_1.2,8.687161254882813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,4,balanced,0.2677440047264099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,8,power_law_1.2,0.23894400596618653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,4,balanced,0.2699199914932251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,4,balanced,0.2722613414128621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,4,balanced,0.27517332633336383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,4,balanced,0.27981332937876385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,8,power_law_1.2,0.2578752040863037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,4,balanced,0.28625067075093585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,8,balanced,7.406592051188151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,4,balanced,0.32340800762176514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,4,balanced,0.3115520079930623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,8,power_law_1.2,0.2786880016326904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,4,balanced,0.41733864943186444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,8,power_law_1.2,0.33282558917999266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,4,balanced,0.3473973274230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,4,balanced,0.4050826629002889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,8,power_law_1.2,0.4195072174072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,4,balanced,0.39826667308807373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,8,power_law_1.2,0.5132736206054688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,4,balanced,0.6122986475626627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,8,power_law_1.2,0.6867392063140869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,8,power_law_1.2,0.9135295867919921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,4,balanced,0.04730666677157084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,4,balanced,0.5744053522745768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,4,balanced,0.05220800141493479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,8,power_law_1.2,1.335257625579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,4,balanced,0.06407999992370605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,4,balanced,0.09962667028109233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,4,balanced,0.1400266687075297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,4,balanced,0.9891946315765381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,8,power_law_1.2,2.1826175689697265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,4,balanced,0.16355733076731363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,4,balanced,0.16531733671824136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,8,power_law_1.2,2.7694015502929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,4,balanced,0.16989866892496744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,4,balanced,0.169487992922465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,4,balanced,1.0417546431223552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,8,power_law_1.2,3.252409744262695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,4,balanced,0.17241599162419638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,4,balanced,0.17218667268753052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,8,power_law_1.2,4.453030395507812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,4,balanced,0.1734666625658671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,4,balanced,0.17612799008687338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,8,power_law_1.2,7.209414672851563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,4,balanced,0.1803306738535563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,4,balanced,1.3373279571533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,4,balanced,0.18818666537602743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,8,power_law_1.2,18.836134338378905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,4,balanced,0.21156267325083414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,4,balanced,0.051642666260401406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,4,balanced,0.2003306746482849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,4,balanced,0.055200000603993736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,4,balanced,0.2629973292350769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,4,balanced,0.06753066678841908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,4,balanced,0.09990400075912476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,4,balanced,0.24125333627065024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,4,balanced,0.14495999614397684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,4,balanced,1.7669119834899902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,4,balanced,0.33113600810368854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,4,balanced,0.1685546636581421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,4,balanced,0.17282134294509888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,4,power_law_1.01,0.08954240083694458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,4,balanced,0.3123146692911784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,4,balanced,0.17338132858276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,4,power_law_1.01,0.1167296051979065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,4,balanced,0.17583467562993368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,4,power_law_1.01,0.08107519745826722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,4,balanced,0.44968533515930176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,4,balanced,0.1776799956957499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,4,power_law_1.01,0.10844160318374634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,4,balanced,0.18021865685780844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,4,power_law_1.01,0.1505344033241272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,4,balanced,0.48711466789245605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,4,balanced,0.18580265839894614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,4,power_law_1.01,0.06639999747276307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,4,power_law_1.01,0.22307200431823732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,4,balanced,0.1875200072924296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,4,balanced,2.116192022959391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,4,power_law_1.01,0.22510080337524413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,4,power_law_1.01,0.0760703980922699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,4,balanced,0.1946880022684733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,4,power_law_1.01,0.062015998363494876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,4,power_law_1.01,0.23457279205322265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,4,balanced,0.20363199710845947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,4,balanced,0.7669066588083903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,4,power_law_1.01,0.09675520062446594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,4,power_law_1.01,0.24515841007232667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,4,power_law_1.01,0.10174720287322998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,4,power_law_1.01,0.13879679441452025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,4,power_law_1.01,0.256057596206665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,4,power_law_1.01,0.14001280069351196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,4,power_law_1.01,0.26883840560913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,4,power_law_1.01,0.14828799962997435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,4,power_law_1.01,0.26398720741271975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,4,balanced,0.21382933855056763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,4,power_law_1.01,0.14994560480117797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,4,balanced,0.8712213039398193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,4,power_law_1.01,0.15308799743652343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,4,power_law_1.01,0.2791296005249023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,4,power_law_1.01,0.16163840293884277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,4,power_law_1.01,0.30709760189056395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,4,power_law_1.01,0.16838400363922118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,4,power_law_1.01,0.3138432025909424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,4,power_law_1.01,0.1776703953742981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,4,power_law_1.01,0.3334847927093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,4,power_law_1.01,0.18867839574813844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,4,balanced,0.22816532850265503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,4,power_law_1.01,0.20571520328521728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,4,power_law_1.01,0.35097599029541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,4,power_law_1.01,0.21813759803771973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,4,power_law_1.01,0.3929919958114624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,4,balanced,1.182469367980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,4,power_law_1.01,0.22041599750518798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,4,power_law_1.01,0.42055678367614746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,4,power_law_1.01,0.26447999477386475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,4,balanced,3.2665065129597983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,4,power_law_1.01,0.467244815826416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,4,power_law_1.01,0.27017600536346437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,4,power_law_1.01,0.558515214920044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,4,power_law_1.01,0.3396352052688599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,4,power_law_1.01,0.381606388092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,4,power_law_1.01,0.6974656105041503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,4,balanced,0.26255999008814496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,4,power_law_1.01,0.4917247772216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,4,power_law_1.01,0.8830400466918945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,4,power_law_1.01,0.6354368209838868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,4,balanced,0.29633599519729614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,4,power_law_1.01,1.0979647636413574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,4,power_law_1.01,0.8688703536987304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,4,balanced,1.545962651570638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,4,power_law_1.01,1.035654354095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,4,power_law_1.01,1.2154687881469726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,4,power_law_1.01,1.4010623931884765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,4,power_law_1.01,1.8223167419433595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,4,balanced,0.3864106734593709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,4,power_law_1.01,1.9033472061157226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,4,power_law_1.01,2.314988708496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,4,power_law_1.01,2.3444223403930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,4,balanced,0.4487893184026082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,4,power_law_1.01,2.6572736740112304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,4,power_law_1.01,4.016198348999024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,4,power_law_1.01,4.255628967285157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,4,power_law_1.01,7.315277099609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,4,power_law_1.01,8.117459106445313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,4,balanced,0.6685547033945719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,4,balanced,1.853962739308675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,4,balanced,0.7964320182800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,4,power_law_1.01,0.07304959893226623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,4,balanced,1.1407679716746013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,4,power_law_1.01,0.09413759708404541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,4,power_law_1.01,0.06532480120658875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,4,power_law_1.2,0.08918399810791015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,4,power_law_1.01,0.08646399974822998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,4,power_law_1.2,0.07316480278968811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,4,balanced,1.5131840705871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,4,power_law_1.2,0.07702400088310242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,4,power_law_1.01,0.10856959819793702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,4,balanced,6.459605534871419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,4,power_law_1.2,0.10424959659576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,4,power_law_1.01,0.1476863980293274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,4,power_law_1.2,0.1326464056968689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,4,power_law_1.01,0.1551424026489258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,4,balanced,2.904266675313314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,4,power_law_1.2,0.21154561042785644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,4,power_law_1.01,0.15520639419555665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,4,power_law_1.2,0.2344575881958008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,4,power_law_1.01,0.1627071976661682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,4,power_law_1.2,0.23407359123229982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,4,balanced,2.123232046763102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,4,power_law_1.01,0.17440639734268187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,4,power_law_1.2,0.24908800125122071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,4,power_law_1.01,0.18752000331878663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,4,power_law_1.2,0.2591808080673218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,4,power_law_1.01,0.19909759759902954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,4,power_law_1.2,0.2742079973220825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,4,power_law_1.01,0.2022847890853882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,4,power_law_1.2,0.2846719980239868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,4,power_law_1.2,0.2918848037719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,4,power_law_1.01,0.22291839122772217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,4,power_law_1.2,0.3201215982437134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,4,power_law_1.01,0.2401599884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,4,balanced,2.827365239461263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,4,power_law_1.2,0.3315520048141479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,4,power_law_1.2,0.3546816110610962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,4,power_law_1.01,0.2454080104827881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,4,power_law_1.2,0.35859839916229247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,4,power_law_1.2,0.43920001983642576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,4,power_law_1.01,0.2756736040115356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,4,power_law_1.2,0.4245312213897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,4,power_law_1.2,0.49854722023010256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,4,power_law_1.2,0.5802879810333252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,4,power_law_1.01,0.30850560665130616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,4,power_law_1.2,0.7556159973144532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,4,balanced,3.4300800959269204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,4,power_law_1.01,0.3764031887054443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,4,power_law_1.2,0.9656831741333007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,4,power_law_1.2,1.2998527526855468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,4,power_law_1.01,0.49753599166870116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,4,power_law_1.01,0.6153791904449463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,4,power_law_1.2,1.4997504234313965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,4,power_law_1.2,1.9535232543945313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,4,power_law_1.01,0.7820735931396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,4,power_law_1.2,0.06587520241737366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,4,balanced,5.745738983154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,4,power_law_1.2,2.7674240112304687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,4,power_law_1.01,0.9745920181274415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,4,power_law_1.2,0.05804799795150757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,4,power_law_1.01,1.3466496467590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,4,power_law_1.2,3.4388607025146483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,4,power_law_1.2,0.061964797973632815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,4,power_law_1.01,1.9775423049926757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,4,power_law_1.2,0.08300799727439881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,4,power_law_1.2,5.073900985717773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,4,power_law_1.01,2.658425521850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,4,power_law_1.2,0.10056960582733154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,4,power_law_1.01,3.3507328033447266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,4,power_law_1.2,0.13345919847488402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,4,power_law_1.2,12.131775665283204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,4,power_law_1.2,0.13998719453811645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,4,power_law_1.01,4.570265579223633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,4,balanced,5.418303807576497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,4,power_law_1.2,0.14918400049209596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,4,power_law_1.01,7.0044097900390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,4,power_law_1.2,0.1519551992416382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,4,power_law_1.2,0.1598528027534485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,4,power_law_1.01,14.527877807617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,4,power_law_1.2,0.171942400932312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,4,power_law_1.2,0.18199039697647096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,4,power_law_1.2,0.1841472029685974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,4,power_law_1.2,0.1982848048210144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,4,power_law_1.2,0.2018496036529541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,4,power_law_1.2,0.22068479061126708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,4,power_law_1.2,0.23055999279022216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,4,power_law_1.2,0.27935359477996824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,4,power_law_1.2,0.28961920738220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,4,power_law_1.2,0.35248000621795655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,4,power_law_1.2,0.4055488109588623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,4,power_law_1.2,0.5565824031829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,4,power_law_1.2,0.6823423862457275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,4,power_law_1.2,0.9510208129882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,4,power_law_1.2,1.163532829284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,4,power_law_1.2,1.6857023239135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,4,power_law_1.2,1.9849151611328124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,4,power_law_1.2,2.524038314819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,4,balanced,10.800821940104166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,4,power_law_1.2,4.688281631469726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,4,power_law_1.2,8.773567962646485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,2,balanced,0.059477334221204124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,2,balanced,0.06810133159160614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,2,balanced,0.08795199791590373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,2,balanced,0.13169067104657492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,4,power_law_1.2,0.0720192015171051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,2,balanced,0.23882132768630981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,4,power_law_1.2,0.060127997398376466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,2,balanced,0.2790079911549886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,4,power_law_1.2,0.06444159746170045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,2,balanced,0.28064000606536865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,4,power_law_1.2,0.0864192008972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,2,balanced,0.27452266216278076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,4,power_law_1.2,0.09873279929161072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,2,balanced,0.2731626629829407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,4,power_law_1.2,0.13733760118484498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,2,balanced,0.2755413254102071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,4,power_law_1.2,0.15801600217819214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,2,balanced,0.2821706732114156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,2,balanced,0.04980266590913137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,2,balanced,0.28246933221817017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,4,power_law_1.2,0.15915520191192628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,2,balanced,0.05725333094596863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,2,balanced,0.2852320075035095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,4,power_law_1.2,0.16228480339050294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,2,balanced,0.06945066650708516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,2,balanced,0.2905706763267517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,4,power_law_1.2,0.17921919822692872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,2,balanced,0.10640000303586324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,2,balanced,0.30348267157872516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,4,power_law_1.2,0.18862080574035645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,2,balanced,0.15355199575424194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,4,power_law_1.2,0.19112319946289064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,2,balanced,0.3208693265914917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,2,balanced,0.17819732427597046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,4,power_law_1.2,0.20787839889526366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,2,balanced,0.3294559915860494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,2,balanced,0.18041066328684488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,4,power_law_1.2,0.23582720756530762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,2,balanced,0.18288532892862955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,2,balanced,0.4058719873428345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,2,balanced,0.18691732486089072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,4,power_law_1.2,0.2509376049041748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,2,balanced,0.38467733065287274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,2,balanced,0.1888213356335958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,2,balanced,0.18950400749842325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,2,balanced,0.5297813415527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,4,power_law_1.2,0.25063679218292234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,2,balanced,0.19666133324305216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,2,balanced,0.47467732429504395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,2,balanced,0.19739200671513876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,2,balanced,0.20371200640996298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,4,power_law_1.2,0.2754175901412964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,2,balanced,0.21289600928624472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,2,balanced,0.6991786956787109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,2,balanced,0.21772799889246622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,4,power_law_1.2,0.3427072048187256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,2,balanced,0.23293866713841757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,2,balanced,0.7421173254648844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,4,power_law_1.2,0.41777920722961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,2,balanced,0.30476800600687665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,2,balanced,0.29098665714263916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,4,power_law_1.2,0.4970367908477783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,4,power_law_1.2,0.5880512237548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,2,balanced,1.232965310414632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,2,balanced,0.3816159963607788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,4,power_law_1.2,0.8716799736022949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,2,balanced,0.38808000087738037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,4,power_law_1.2,1.0097344398498536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,2,balanced,0.5650879939397176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,4,power_law_1.2,1.6807680130004883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,2,balanced,1.3365599314371746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,4,power_law_1.2,2.0749568939208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,4,power_law_1.2,3.1564096450805663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,2,balanced,0.644266684850057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,4,power_law_1.2,3.7879425048828126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,2,power_law_1.01,0.06552960276603699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,4,power_law_1.2,5.087007904052735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,2,balanced,1.9968053499857585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,2,balanced,1.0400746663411458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,2,power_law_1.01,0.07479680180549622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,2,power_law_1.01,0.08103039860725403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,4,power_law_1.2,8.818611145019531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,2,power_law_1.01,0.10945279598236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,2,power_law_1.01,0.14479999542236327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,2,power_law_1.01,0.22400639057159424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,4,power_law_1.2,18.371212768554688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,2,balanced,1.211674690246582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,2,balanced,0.0655626654624939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,2,power_law_1.01,0.23678719997406006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,2,power_law_1.01,0.05459200143814087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,2,balanced,0.07049599786599477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,2,power_law_1.01,0.24481918811798095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,2,balanced,0.08156266808509827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,2,power_law_1.01,0.0648256003856659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,2,balanced,2.575157324473063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,2,power_law_1.01,0.25435519218444824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,2,balanced,0.11495467027028401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,2,power_law_1.01,0.06380800008773804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,2,power_law_1.01,0.26416640281677245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,2,balanced,0.16171733538309732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,2,power_law_1.01,0.08810240030288696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,2,power_law_1.01,0.2728319883346558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,2,balanced,1.764095942179362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,2,balanced,0.19262399276097616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,2,power_law_1.01,0.10801279544830322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,2,power_law_1.01,0.29185919761657714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,2,balanced,0.1940106749534607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,2,power_law_1.01,0.1461184024810791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,2,power_law_1.01,0.3012095928192139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,2,balanced,0.19650665918986002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,2,power_law_1.01,0.1533504009246826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,2,power_law_1.01,0.3016511917114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,2,balanced,0.2014453411102295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,2,power_law_1.01,0.16581120491027831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,2,power_law_1.01,0.3271615982055664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,2,balanced,0.2036693294843038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,2,power_law_1.01,0.17061760425567626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,2,power_law_1.01,0.35422720909118655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,2,power_law_1.01,0.17277439832687377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,2,balanced,0.21179733673731485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,2,balanced,2.912480036417643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,2,power_law_1.01,0.18247679471969605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,2,power_law_1.01,0.3606015920639038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,2,balanced,2.2875839869181314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,2,balanced,0.21711466709772745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,2,power_law_1.01,0.19392640590667726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,2,power_law_1.01,0.4208384037017822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,2,balanced,0.22562666734059653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,2,power_law_1.01,0.20249600410461427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,2,power_law_1.01,0.44867839813232424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,2,balanced,0.2360373338063558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,2,power_law_1.01,0.20747520923614501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,2,power_law_1.01,0.5548031806945801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,2,balanced,0.2509066661198934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,2,power_law_1.01,0.22255361080169678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,2,power_law_1.01,0.5856704235076904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,2,power_law_1.01,0.23484160900115966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,2,power_law_1.01,0.7384255886077881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,2,power_law_1.01,0.25061759948730467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,2,power_law_1.01,0.2983936071395874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,2,power_law_1.01,1.0219584465026856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,2,balanced,0.271071990331014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,2,power_law_1.01,0.3255808115005493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,2,power_law_1.01,1.2846464157104491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,2,balanced,2.622901280721029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,2,power_law_1.01,0.4043712139129639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,2,power_law_1.01,1.5883071899414063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,2,power_law_1.01,0.44675841331481936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,2,power_law_1.2,0.066457599401474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,2,power_law_1.01,2.2601856231689452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,2,power_law_1.01,0.6251391887664794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,2,balanced,0.2985066572825114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,2,power_law_1.2,0.06503040194511414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,2,power_law_1.01,0.7974080085754395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,2,power_law_1.01,2.7468799591064452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,2,balanced,4.547552108764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,2,power_law_1.01,0.06835839748382569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,2,power_law_1.2,0.08088319897651672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,2,power_law_1.01,1.0880191802978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,2,power_law_1.01,3.468000030517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,2,power_law_1.01,0.077702397108078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,2,power_law_1.2,0.10049279928207397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,2,power_law_1.01,1.2884096145629882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,2,power_law_1.01,0.07790719866752624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,2,power_law_1.01,5.288627243041992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,2,power_law_1.2,0.13594239950180054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,2,power_law_1.01,1.781318473815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,2,power_law_1.01,0.10047999620437623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,2,power_law_1.2,0.21627519130706788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,2,power_law_1.01,0.11875840425491332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,2,balanced,0.39290666580200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,2,power_law_1.01,2.395110321044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,2,power_law_1.01,0.15509120225906373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,2,power_law_1.01,10.768927764892577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,2,power_law_1.2,0.23420159816741942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,2,power_law_1.01,0.17153919935226442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,2,balanced,0.4510026772816976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,2,power_law_1.01,2.8742464065551756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,2,power_law_1.2,0.251910400390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,2,power_law_1.01,0.17583999633789063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,2,power_law_1.01,0.18353919982910155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,2,power_law_1.2,0.25690879821777346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,2,power_law_1.01,4.391302490234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,2,power_law_1.01,0.19496320486068724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,2,power_law_1.2,0.2693376064300537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,2,power_law_1.01,0.2136512041091919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,2,balanced,4.178079922993978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,2,power_law_1.01,0.22245121002197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,2,power_law_1.2,0.27776639461517333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,2,power_law_1.01,9.461312103271485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,2,balanced,0.5890933275222778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,2,power_law_1.01,0.24141440391540528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,2,power_law_1.2,0.29271678924560546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,2,power_law_1.01,0.2615423917770386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,2,balanced,0.7013333638509115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,2,power_law_1.01,0.29092481136322024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,2,power_law_1.2,0.307859206199646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,2,power_law_1.2,0.30382080078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,2,balanced,1.0528000195821126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,2,power_law_1.01,0.2970495939254761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,2,power_law_1.2,0.3265343904495239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,2,power_law_1.2,0.3527679920196533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,2,balanced,1.289749304453532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,2,power_law_1.01,0.3332607984542847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,2,power_law_1.2,0.36732161045074463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,2,power_law_1.2,0.4288640022277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,2,power_law_1.01,0.4227263927459717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,2,power_law_1.2,0.45963521003723146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,2,balanced,1.8619146347045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,2,power_law_1.01,0.5089536190032959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,2,power_law_1.2,0.5689280033111572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,2,power_law_1.01,0.6776383876800537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,2,power_law_1.2,0.6202816009521485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,2,power_law_1.2,0.8164352416992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,2,power_law_1.01,0.827724838256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,2,power_law_1.2,1.009171199798584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,2,power_law_1.01,1.094591999053955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,2,balanced,2.4410667419433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,2,power_law_1.2,1.3788479804992675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,2,power_law_1.01,1.3589823722839356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,2,balanced,8.710122426350912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,2,power_law_1.01,2.0087167739868166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,2,power_law_1.2,1.7153280258178711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,2,power_law_1.01,2.575974464416504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,2,power_law_1.2,2.3964799880981444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,2,power_law_1.01,3.795052719116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,2,power_law_1.2,2.86059513092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,2,power_law_1.01,4.89056625366211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,2,balanced,3.4899466832478843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,2,power_law_1.2,3.7067520141601564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,2,power_law_1.01,6.101715087890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,2,power_law_1.01,10.080921936035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,2,power_law_1.2,5.815398406982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,2,balanced,8.166410446166992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,2,power_law_1.01,21.24486389160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,2,power_law_1.2,12.340589141845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,2,balanced,4.658506711324056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,2,balanced,5.6593812306722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,2,power_law_1.2,0.05516800284385681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,2,power_law_1.2,0.05399680137634277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,2,power_law_1.2,0.0630400002002716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,2,power_law_1.2,0.0807039976119995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,2,power_law_1.2,0.10198400020599366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,2,power_law_1.2,0.14817919731140136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,2,power_law_1.2,0.15338239669799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,2,power_law_1.2,0.1619647979736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,2,power_law_1.2,0.16943360567092897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,2,balanced,9.054927825927734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,2,power_law_1.2,0.18150399923324584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,2,power_law_1.2,0.18683520555496216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,2,power_law_1.2,0.19895679950714112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,2,power_law_1.2,0.21075201034545898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,2,power_law_1.2,0.21555840969085693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,2,power_law_1.2,0.22340478897094726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,2,power_law_1.2,0.24330239295959472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,2,power_law_1.2,0.2585024118423462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,2,power_law_1.2,0.31049599647521975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,2,power_law_1.2,0.32990078926086425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,2,power_law_1.2,0.4253119945526123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,2,power_law_1.2,0.48275198936462405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,2,power_law_1.2,0.620582389831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,2,power_law_1.2,0.837286376953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,2,power_law_1.2,1.1982399940490722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,2,power_law_1.2,1.4348544120788573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,2,power_law_1.2,2.047808074951172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,2,power_law_1.2,2.491596794128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,2,power_law_1.2,3.102726364135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,2,power_law_1.2,4.995923233032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,2,power_law_1.2,10.918515014648438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,2,balanced,17.843029022216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,2,power_law_1.2,0.06995199918746949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,1,balanced,0.06347199777762096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,2,power_law_1.2,0.06933760046958923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,1,balanced,0.07760533193747203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,2,power_law_1.2,0.07808640003204345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,2,power_law_1.2,0.08974080085754395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,1,balanced,0.10039466619491577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,2,power_law_1.2,0.11476479768753052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,1,balanced,0.1521440049012502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,2,power_law_1.2,0.15911680459976196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,2,power_law_1.2,0.17237759828567506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,1,balanced,0.2588106592496236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,2,power_law_1.2,0.17482240200042726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,1,balanced,0.30582932631174725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,2,power_law_1.2,0.18934400081634523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,2,power_law_1.2,0.2027519941329956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,1,balanced,0.30796800057093304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,2,power_law_1.2,0.2164031982421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,1,balanced,0.31441599130630493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,2,power_law_1.2,0.22668159008026123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,1,balanced,0.3138773242632548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,2,power_law_1.2,0.24829440116882323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,1,balanced,0.31861867507298786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,2,power_law_1.2,0.26965761184692383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,1,balanced,0.31834133466084796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,2,power_law_1.2,0.2967744112014771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,1,balanced,0.05412800113360087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,1,balanced,0.32413333654403687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,1,balanced,0.32788799206415814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,1,balanced,0.06446399788061778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,2,power_law_1.2,0.3050112009048462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,1,balanced,0.07948266466458638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,1,balanced,0.33834131558736164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,1,balanced,0.12196800112724304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,1,balanced,0.3490026791890462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,1,balanced,0.18264534076054892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,2,power_law_1.2,0.3391808032989502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,1,balanced,0.35844798882802326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,1,balanced,0.21568000316619873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,1,balanced,0.37670934200286865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,1,balanced,0.223855992158254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,2,power_law_1.2,0.43720321655273436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,1,balanced,0.22128534317016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,1,balanced,0.518725315729777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,2,power_law_1.2,0.5121088027954102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,1,balanced,0.22874132792154947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,1,power_law_1.01,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,1,balanced,0.4797866741816203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,2,power_law_1.2,0.6749311923980713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,1,balanced,0.2273226579030355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,2,power_law_1.2,0.7925055980682373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,1,power_law_1.01,0.0695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,1,balanced,0.6303893327713013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,1,balanced,0.2312320073445638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,2,power_law_1.2,1.0662015914916991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,1,power_law_1.01,0.08204159736633301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,2,power_law_1.2,1.3936703681945801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,1,balanced,0.23458133141199747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,1,balanced,0.645365317662557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,1,power_law_1.01,0.12407679557800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,2,power_law_1.2,2.193267250061035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,1,balanced,0.2395306626955668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,1,power_law_1.01,0.05185279846191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,1,power_law_1.01,0.16299519538879395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,2,power_law_1.2,2.828633689880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,1,balanced,0.09401599566141765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,1,balanced,0.2525493303934733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,1,power_law_1.01,0.2472383975982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,1,balanced,1.0418079694112141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,1,power_law_1.01,0.05971199870109558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,2,power_law_1.2,4.209420776367187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,1,balanced,0.2637919982274373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,1,balanced,0.10248000423113506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,1,power_law_1.01,0.2571135997772217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,1,power_law_1.01,0.06887680292129517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,2,power_law_1.2,5.317472076416015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,1,balanced,0.11408000191052754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,1,power_law_1.01,0.2722752094268799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,1,balanced,0.2823359966278076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,1,power_law_1.01,0.10090240240097045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,2,power_law_1.2,6.221004867553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,1,balanced,1.0700639883677165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,1,balanced,0.15432533621788025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,1,power_law_1.01,0.12267520427703857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,1,power_law_1.01,0.289900803565979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,1,balanced,0.30131733417510986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,1,balanced,0.21942933400472006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,2,power_law_1.2,11.068576049804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,1,power_law_1.01,0.17461119890213012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,1,power_law_1.01,0.28945920467376707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,1,balanced,0.2574453353881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,1,balanced,0.43490668137868244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,1,power_law_1.01,0.1885632038116455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,1,power_law_1.01,0.28808319568634033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,1,balanced,1.8814133008321126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,1,balanced,0.26306132475535077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,2,power_law_1.2,22.107501220703124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,1,balanced,0.39025600751241046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,1,power_law_1.01,0.19741439819335938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,1,power_law_1.01,0.304422402381897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,1,balanced,0.26848532756169635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,1,balanced,0.27904532353083294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,1,power_law_1.01,0.20415360927581788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,1,power_law_1.01,0.31077120304107664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,1,balanced,0.4965226650238037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,1,balanced,0.2821919918060303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,1,power_law_1.01,0.2126784086227417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,1,power_law_1.01,0.3388864040374756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,1,balanced,0.2943093379338582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,1,balanced,2.0434346199035645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,1,balanced,0.5444159905115763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,1,power_law_1.01,0.22305920124053955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,1,power_law_1.01,0.3709376096725464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,1,balanced,0.30560533205668133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,1,power_law_1.01,0.24365439414978027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,1,power_law_1.01,0.3825792074203491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,1,balanced,0.31833066542943317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,1,balanced,0.8688053290049235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,1,power_law_1.01,0.2547264099121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,1,power_law_1.01,0.41052799224853515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,1,balanced,0.3420906861623128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,1,power_law_1.01,0.25304958820343015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,1,power_law_1.01,0.5101312160491943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,1,balanced,0.36557865142822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,1,power_law_1.01,0.27733120918273924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,1,balanced,1.0082720120747883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,1,power_law_1.01,0.5390079975128174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,1,balanced,3.0504480997721353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,1,power_law_1.01,0.2979327917098999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,1,power_law_1.01,0.6603839874267579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,1,power_law_1.01,0.34011518955230713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,1,power_law_1.01,0.7823679924011231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,1,balanced,0.42127466201782227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,1,power_law_1.01,0.41283202171325684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,1,balanced,1.5750880241394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,1,power_law_1.01,0.9936127662658691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,1,power_law_1.01,0.435807991027832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,1,power_law_1.01,1.3972224235534667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,1,power_law_1.01,0.5338624000549317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,1,power_law_1.01,1.813644790649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,1,power_law_1.01,0.6444416046142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,1,balanced,0.476309339205424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,1,power_law_1.01,2.1877695083618165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,1,balanced,1.9360052744547527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,1,power_law_1.01,0.8353792190551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,1,balanced,3.9239625930786133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,1,power_law_1.01,3.1014528274536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,1,power_law_1.01,1.0780223846435546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,1,power_law_1.01,4.072633743286133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,1,power_law_1.01,1.49684476852417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,1,power_law_1.01,1.9038528442382812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,1,balanced,0.6341066757837931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,1,power_law_1.01,4.968467330932617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,1,power_law_1.01,2.7636224746704103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,1,balanced,0.740277369817098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,1,balanced,2.836432139078776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,1,power_law_1.01,7.481452941894531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,1,power_law_1.01,3.613625717163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,1,balanced,0.9859039783477783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,1,power_law_1.01,4.4082176208496096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,1,power_law_1.01,15.22503662109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,1,balanced,1.2083306312561035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,1,balanced,4.478032112121582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,1,power_law_1.01,6.811199951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,1,balanced,1.8148159980773926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,1,power_law_1.01,14.311570739746093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,1,balanced,3.600645383199056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,1,balanced,2.2596853574117026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,1,balanced,3.2791306177775064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,1,balanced,4.330666542053223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,1,balanced,4.2281920115153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,1,balanced,7.089701334635417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,1,power_law_1.01,0.08375679850578308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,1,power_law_1.01,0.09427840113639832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,1,power_law_1.01,0.10747519731521607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,1,balanced,6.224143981933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,1,power_law_1.2,0.0597055971622467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,1,power_law_1.01,0.1310464024543762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,1,power_law_1.01,0.15478399991989136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,1,power_law_1.2,0.06499199867248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,1,power_law_1.01,0.2134399890899658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,1,power_law_1.2,0.08289920091629029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,1,power_law_1.01,0.22958719730377197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,1,power_law_1.01,0.23941121101379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,1,power_law_1.2,0.11756800413131714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,1,power_law_1.01,0.2562432050704956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,1,power_law_1.2,0.15255039930343628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,1,power_law_1.01,0.26545279026031493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,1,power_law_1.01,0.2866431951522827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,1,power_law_1.2,0.24318079948425292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,1,power_law_1.01,0.30974080562591555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,1,power_law_1.2,0.25320959091186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,1,balanced,8.280986785888672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,1,power_law_1.01,0.3295167922973633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,1,balanced,6.731589635213216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,1,power_law_1.2,0.27596800327301024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,1,power_law_1.01,0.37521278858184814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,1,power_law_1.01,0.4217216014862061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,1,power_law_1.2,0.2877952098846436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,1,power_law_1.2,0.29166719913482664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,1,power_law_1.2,0.29484798908233645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,1,power_law_1.01,0.45121278762817385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,1,power_law_1.2,0.31551361083984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,1,power_law_1.2,0.32486400604248045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,1,power_law_1.2,0.3616192102432251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,1,power_law_1.01,0.5165376186370849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,1,power_law_1.2,0.3746687889099121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,1,power_law_1.2,0.3953536033630371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,1,balanced,10.149674733479818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,1,power_law_1.2,0.4146304130554199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,1,power_law_1.01,0.6435071945190429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,1,power_law_1.01,0.7673535823822022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,1,power_law_1.2,0.517190408706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,1,power_law_1.01,1.0268544197082519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,1,power_law_1.2,0.5429376125335693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,1,power_law_1.01,1.2737919807434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,1,balanced,14.253028869628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,1,power_law_1.2,0.6699776172637939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,1,power_law_1.01,1.7559295654296876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,1,power_law_1.01,2.2509632110595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,1,power_law_1.2,0.7970176219940186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,1,power_law_1.01,3.2372032165527345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,1,power_law_1.2,1.0138751983642578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,1,power_law_1.01,4.230310440063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,1,power_law_1.2,1.4118847846984863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,1,power_law_1.01,6.222035217285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,1,power_law_1.2,1.8934911727905273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,1,power_law_1.01,8.197708892822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,1,power_law_1.2,2.229958343505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,1,power_law_1.2,0.05169919729232788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,1,power_law_1.01,10.185209655761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,1,power_law_1.2,3.1738752365112304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,1,power_law_1.2,0.0555840015411377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,1,power_law_1.2,0.07050880193710327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,1,power_law_1.2,4.137811279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,1,power_law_1.01,16.13514862060547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,1,balanced,16.23202641805013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,1,power_law_1.2,0.09496319890022278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,1,power_law_1.2,0.11407999992370606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,1,power_law_1.2,5.216275024414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,1,power_law_1.2,0.1750656008720398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,1,power_law_1.2,0.18665599822998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,1,balanced,13.483088175455729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,1,power_law_1.2,7.843142700195313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,1,power_law_1.01,32.05854797363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,1,power_law_1.2,0.20131199359893798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,1,power_law_1.2,0.2095103979110718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,1,power_law_1.2,0.2189311981201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,1,power_law_1.2,15.417100524902343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,1,power_law_1.2,0.22837119102478026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,1,power_law_1.2,0.25049600601196287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,1,power_law_1.2,0.26163198947906496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,1,power_law_1.2,0.26844799518585205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,1,power_law_1.2,0.2859391927719116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,1,power_law_1.2,0.3023103952407837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,1,power_law_1.2,0.34161279201507566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,1,power_law_1.2,0.4199039936065674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,1,power_law_1.2,0.4433472156524658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,1,power_law_1.2,0.5548223972320556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,1,power_law_1.2,0.6518911838531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,1,power_law_1.2,0.8554816246032715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,1,power_law_1.2,1.0948863983154298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,1,power_law_1.2,1.5181183815002441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,1,power_law_1.2,1.9421056747436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,1,power_law_1.2,2.792198371887207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,1,power_law_1.2,3.702950286865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,1,power_law_1.2,4.62242546081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,1,power_law_1.2,7.215564727783203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,1,balanced,32.23402659098307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,1,power_law_1.2,14.553208923339843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,16,balanced,0.08061866462230682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,16,balanced,0.0817333310842514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,16,balanced,0.08169066905975342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,16,balanced,0.12463466326395671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,1,power_law_1.2,0.08317440152168273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,16,balanced,0.20278400182724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,1,power_law_1.2,0.09497600197792053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,16,balanced,0.36910398801167804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,1,power_law_1.2,0.10565119981765747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,16,balanced,0.5341813166936239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,1,power_law_1.2,0.12556159496307373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,16,balanced,0.5290666818618774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,1,power_law_1.2,0.14639359712600708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,16,balanced,0.5312639872233073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,1,power_law_1.2,0.21137919425964355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,16,balanced,0.5319093465805054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,1,power_law_1.2,0.23147521018981934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,16,balanced,0.531338651974996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,1,power_law_1.2,0.2397183895111084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,16,balanced,0.5326293309529623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,1,power_law_1.2,0.25760641098022463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,16,balanced,0.535647988319397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,1,power_law_1.2,0.2772543907165527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,16,balanced,0.5355519851048788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,1,power_law_1.2,0.29367680549621583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,16,balanced,0.5451146761576334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,1,power_law_1.2,0.3181823968887329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,1,power_law_1.2,0.33845760822296145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,16,balanced,0.5434720118840536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,1,power_law_1.2,0.37772159576416015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,16,balanced,0.5507520039876302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,1,power_law_1.2,0.428326416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,16,balanced,0.5623039801915487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,16,balanced,0.5954346656799316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,1,power_law_1.2,0.4561920166015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,16,balanced,0.6140906810760498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,16,balanced,0.6304906606674194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,1,power_law_1.2,0.5203264236450196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,16,balanced,0.6689600149790446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,1,power_law_1.2,0.6488831996917724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,1,power_law_1.2,0.7720831871032715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,16,balanced,0.7275466918945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,1,power_law_1.2,1.0396736145019532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,1,power_law_1.2,1.2823295593261719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,1,power_law_1.2,1.7671871185302734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,16,balanced,0.7980480194091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,1,power_law_1.2,2.256550407409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,16,balanced,0.055904000997543335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,1,power_law_1.2,3.2460289001464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,16,balanced,0.059290667374928795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,1,power_law_1.2,4.241523361206054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,16,balanced,0.06353599826494853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,16,balanced,0.08770133058230083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,16,balanced,0.9968000253041586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,1,power_law_1.2,6.232614517211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,16,balanced,0.12943466504414877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,16,balanced,0.20800000429153442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,1,power_law_1.2,8.221920013427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,16,balanced,0.2935466567675273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,16,balanced,0.296015997727712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,1,power_law_1.2,10.198271942138671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,16,balanced,0.2945546706517537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,16,balanced,0.2949013312657674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,16,balanced,1.1294079621632893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,16,balanced,0.29852267106374103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,1,power_law_1.2,16.154783630371092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,16,balanced,0.3014240066210429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,16,balanced,0.3031253417332967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,16,balanced,0.3049439986546834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,1,power_law_1.2,32.09086608886719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,16,balanced,0.3113386631011963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,16,balanced,0.31495465834935504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,16,power_law_1.01,0.22139520645141603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,16,balanced,0.3229440053304036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,16,balanced,1.5437706311543782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,16,power_law_1.01,0.39105920791625975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,16,balanced,0.3396746714909871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,16,power_law_1.01,0.5251008033752441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,16,balanced,0.3548106749852498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,16,power_law_1.01,0.14994560480117797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,16,balanced,0.3810986677805583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,16,power_law_1.01,0.19041919708251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,16,power_law_1.01,0.3103552103042603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,16,balanced,0.051594664653142296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,16,balanced,0.40771734714508057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,16,power_law_1.01,0.3260607957839966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,16,power_law_1.01,0.1326591968536377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,16,balanced,0.05171733101209005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,16,balanced,0.06496533254782359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,16,power_law_1.01,0.4086336135864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,16,balanced,0.45826133092244464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,16,balanced,1.988378683725993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,16,power_law_1.01,0.21132800579071045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,16,balanced,0.0925439993540446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,16,power_law_1.01,0.28434560298919676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,16,power_law_1.01,0.4006656169891357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,16,balanced,0.13876799742380777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,16,power_law_1.01,0.10285439491271972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,16,power_law_1.01,0.4486527919769287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,16,balanced,0.2109066645304362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,16,balanced,0.5179093281428019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,16,power_law_1.01,0.13023359775543214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,16,balanced,0.29547733068466187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,16,power_law_1.01,0.1615872025489807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,16,power_law_1.01,0.43809919357299804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,16,balanced,0.29808000723520917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,16,power_law_1.01,0.19555840492248536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,16,power_law_1.01,0.4672704219818115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,16,power_law_1.01,0.22101759910583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,16,balanced,0.29636265834172565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,16,balanced,0.6128693421681722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,16,power_law_1.01,0.2427903890609741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,16,power_law_1.01,0.4383999824523926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,16,balanced,0.29652265707651776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,16,power_law_1.01,0.2383552074432373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,16,balanced,0.2996053298314412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,16,power_law_1.01,0.44504318237304685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,16,power_law_1.01,0.2504192113876343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,16,balanced,0.3015039960543315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,16,power_law_1.01,0.5003520011901855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,16,power_law_1.01,0.24432001113891602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,16,balanced,0.30338666836420697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,16,power_law_1.01,0.27835519313812257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,16,power_law_1.01,0.5043839931488037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,16,balanced,0.782912015914917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,16,power_law_1.01,0.27543039321899415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,16,balanced,0.3060800035794576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,16,power_law_1.01,0.5456960201263428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,16,power_law_1.01,0.2773823976516724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,16,balanced,0.313482662041982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,16,power_law_1.01,0.5963263988494873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,16,power_law_1.01,0.29633920192718505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,16,balanced,0.31571733951568604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,16,power_law_1.01,0.6309120178222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,16,power_law_1.01,0.32673280239105223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,16,balanced,2.905861218770345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,16,balanced,0.32393066088358563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,16,power_law_1.01,0.3766527891159058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,16,power_law_1.01,0.7577536106109619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,16,power_law_1.01,0.37500159740447997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,16,power_law_1.01,0.8047807693481446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,16,balanced,0.34163200855255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,16,balanced,0.9783679644266764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,16,power_law_1.01,0.45533437728881837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,16,power_law_1.01,1.0515007972717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,16,power_law_1.01,0.46939520835876464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,16,power_law_1.01,0.9248767852783203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,16,power_law_1.01,0.612505578994751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,16,power_law_1.01,1.1790528297424316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,16,power_law_1.01,0.6417151927947998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,16,power_law_1.01,0.8255743980407715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,16,power_law_1.01,1.557049560546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,16,balanced,0.35975468158721924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,16,power_law_1.01,1.1317440032958985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,16,power_law_1.2,0.22108159065246583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,16,power_law_1.01,1.9924736022949219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,16,power_law_1.01,1.5702848434448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,16,power_law_1.2,0.39025280475616453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,16,power_law_1.01,2.507904052734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,16,power_law_1.01,2.0010175704956055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,16,balanced,1.3160906632741292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,16,power_law_1.2,0.23394560813903809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,16,power_law_1.01,0.14321919679641723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,16,power_law_1.01,2.2859392166137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,16,power_law_1.01,2.992959976196289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,16,power_law_1.2,0.14482560157775878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,16,power_law_1.01,0.21697919368743895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,16,power_law_1.01,3.344723129272461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,16,power_law_1.01,4.653337478637695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,16,power_law_1.2,0.22605440616607667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,16,power_law_1.01,0.2949696063995361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,16,power_law_1.01,7.413919830322266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,16,power_law_1.01,0.10295039415359497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,16,power_law_1.2,0.26565120220184324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,16,balanced,0.3998773495356242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,16,power_law_1.01,8.632621002197265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,16,power_law_1.01,0.14647040367126465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,16,power_law_1.2,0.3086591958999634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,16,power_law_1.01,0.19301120042800904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,16,balanced,0.42924265066782635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,16,power_law_1.2,0.3589951992034912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,16,power_law_1.01,0.18908159732818602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,16,power_law_1.2,0.42664318084716796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,16,balanced,1.6627626419067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,16,balanced,0.4840159813563029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,16,power_law_1.01,0.2352832078933716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,16,power_law_1.2,0.43420162200927737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,16,power_law_1.01,0.2416383981704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,16,power_law_1.2,0.38955519199371336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,16,power_law_1.01,0.24566400051116943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,16,power_law_1.2,0.4590015888214111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,16,power_law_1.01,0.25920639038085935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,16,power_law_1.2,0.45308799743652345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,16,power_law_1.01,0.2547327995300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,16,balanced,0.5773813327153524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,16,power_law_1.2,0.4757120132446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,16,balanced,5.349434534708659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,16,power_law_1.01,0.28224639892578124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,16,power_law_1.2,0.5023935794830322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,16,power_law_1.01,0.29840641021728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,16,power_law_1.2,0.5087552070617676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,16,power_law_1.01,0.32391040325164794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,16,balanced,0.6975893179575602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,16,power_law_1.2,0.5404543876647949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,16,power_law_1.01,0.337228798866272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,16,power_law_1.2,0.6570752143859864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,16,power_law_1.01,0.360319995880127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,16,power_law_1.2,0.6660096168518066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,16,balanced,2.500037352244059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,16,power_law_1.01,0.44659838676452634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,16,power_law_1.2,0.8663935661315918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,16,balanced,1.002842664718628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,16,power_law_1.2,0.9091263771057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,16,power_law_1.01,0.4553088188171387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,16,power_law_1.2,1.1101119995117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,16,power_law_1.2,1.1009407997131349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,16,power_law_1.01,0.49288320541381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,16,power_law_1.2,1.3276608467102051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,16,power_law_1.01,0.547046422958374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,16,balanced,1.2651413281758626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,16,power_law_1.2,1.8035263061523437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,16,power_law_1.01,0.7728960037231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,16,power_law_1.2,2.4696767807006834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,16,power_law_1.01,0.8354496002197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,16,power_law_1.2,3.006278419494629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,16,power_law_1.01,1.1559167861938477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,16,power_law_1.2,3.711251068115234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,16,power_law_1.01,1.5104384422302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,16,power_law_1.2,5.698412704467773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,16,power_law_1.01,2.1238143920898436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,16,balanced,1.7451252937316895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,16,power_law_1.01,2.5972991943359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,16,power_law_1.2,12.049139404296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,16,power_law_1.01,3.413119888305664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,16,power_law_1.2,0.13331199884414674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,16,power_law_1.01,5.7210945129394535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,16,power_law_1.2,0.21644799709320067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,16,power_law_1.2,0.20869760513305663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,16,power_law_1.01,10.941395568847657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,16,power_law_1.2,0.09664000272750854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,16,power_law_1.2,0.12903679609298707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,16,balanced,2.2147839864095054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,16,balanced,4.742010752360026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,16,power_law_1.2,0.15960320234298705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,16,power_law_1.2,0.1672767996788025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,16,power_law_1.2,0.20730879306793212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,16,power_law_1.2,0.23697280883789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,16,power_law_1.2,0.2275712013244629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,16,power_law_1.2,0.23710079193115235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,16,power_law_1.2,0.24941439628601075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,16,power_law_1.2,0.24161279201507568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,16,power_law_1.2,0.26871678829193113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,16,power_law_1.2,0.2928191900253296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,16,balanced,3.4073012669881186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,16,power_law_1.2,0.317305588722229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,16,power_law_1.2,0.32969601154327394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,16,power_law_1.2,0.37160320281982423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,16,power_law_1.2,0.3919296026229858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,16,power_law_1.2,0.4965695858001709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,16,power_law_1.2,0.5296639919281005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,16,power_law_1.2,0.64901762008667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,16,power_law_1.2,0.6820288181304932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,16,power_law_1.2,0.9319040298461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,16,power_law_1.2,1.191596794128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,16,power_law_1.2,1.895782470703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,16,power_law_1.2,2.1244224548339843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,16,power_law_1.2,2.8040895462036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,16,power_law_1.2,4.386361694335937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,16,power_law_1.2,8.84286117553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,16,power_law_1.2,0.143340802192688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,16,power_law_1.2,0.216428804397583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,8,balanced,0.061093335350354515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,16,power_law_1.2,0.2066879987716675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,8,balanced,0.06576533118883769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,8,balanced,0.08238933483759563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,16,power_law_1.2,0.09683200120925903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,8,balanced,0.12609066565831503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,16,power_law_1.2,0.1214784026145935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,16,balanced,6.597696304321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,8,balanced,0.20336532592773438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,16,power_law_1.2,0.14953600168228148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,8,balanced,0.3721919854482015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,16,power_law_1.2,0.17832959890365602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,8,balanced,0.5318880081176758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,16,power_law_1.2,0.20830080509185792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,8,balanced,0.05035200218359629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,8,balanced,0.5295999844868978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,16,power_law_1.2,0.2103872060775757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,8,balanced,0.052416001756985985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,8,balanced,0.5308586756388346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,8,balanced,0.06319466729958852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,16,power_law_1.2,0.231276798248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,8,balanced,0.5324960152308146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,8,balanced,0.08880533774693807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,16,power_law_1.2,0.24446721076965333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,8,balanced,0.5324639876683553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,8,balanced,0.1302239994208018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,8,balanced,0.5352586507797241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,16,power_law_1.2,0.25938560962677004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,8,balanced,0.21253333489100137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,8,balanced,0.5379466613133749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,8,balanced,0.2945386568705241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,16,power_law_1.2,0.2787071943283081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,8,balanced,0.5403093496958414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,8,balanced,0.29607999324798584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,16,power_law_1.2,0.2973376035690308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,8,balanced,0.5483786662419637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,8,balanced,0.2956906755765279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,16,power_law_1.2,0.33511040210723875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,8,balanced,0.5506346623102824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,8,balanced,0.29690666993459064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,16,power_law_1.2,0.3317631959915161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,8,balanced,0.5585226615269979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,8,balanced,0.3001280029614766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,16,power_law_1.2,0.3797440052032471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,8,balanced,0.3033919930458069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,8,balanced,0.5718880097071329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,8,balanced,0.304970661799113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,16,power_law_1.2,0.45578880310058595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,8,balanced,0.6004106601079305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,8,balanced,0.3093386689821879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,8,balanced,0.625653346379598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,8,balanced,0.3185653289159139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,16,power_law_1.2,0.4824512004852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,8,balanced,0.3258986671765645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,8,balanced,0.6475253502527872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,8,balanced,0.33023999134699505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,16,power_law_1.2,0.5264959812164307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,8,balanced,0.6959786415100098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,8,balanced,0.346837321917216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,16,power_law_1.2,0.6570943832397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,8,balanced,0.36285332838694256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,16,power_law_1.2,0.8309696197509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,8,balanced,0.7633600234985352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,8,balanced,0.39502934614817303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,16,power_law_1.2,0.9573311805725098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,8,balanced,0.43562666575113934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,8,balanced,0.857151985168457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,16,power_law_1.2,1.212934398651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,8,balanced,0.5011786619822184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,16,power_law_1.2,1.8500799179077148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,16,power_law_1.2,2.7802303314208983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,8,balanced,0.05218133330345154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,8,balanced,0.5630773305892944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,8,power_law_1.01,0.13100800514221192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,8,balanced,1.066101312637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,16,power_law_1.2,3.135219192504883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,8,balanced,0.05816533168156942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,8,power_law_1.01,0.0877568006515503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,8,power_law_1.01,0.20078721046447753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,8,balanced,0.06885866820812225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,16,power_law_1.2,3.742067337036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,8,power_law_1.01,0.1220479965209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,8,balanced,0.09569066762924194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,8,power_law_1.01,0.35790719985961916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,8,balanced,0.14108266433080038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,8,balanced,0.6832106908162435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,8,power_law_1.01,0.20268800258636474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,8,power_law_1.01,0.12842880487442015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,8,balanced,0.21659733851750693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,16,power_law_1.2,5.829856109619141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,8,power_law_1.01,0.1011199951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,8,balanced,0.2974560062090556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,8,power_law_1.01,0.17509119510650634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,8,balanced,1.26145601272583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,8,balanced,0.29794132709503174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,8,power_law_1.01,0.11809920072555542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,8,power_law_1.01,0.2772864103317261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,8,balanced,0.30083199342091876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,16,power_law_1.2,17.079930114746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,8,power_law_1.01,0.1630911946296692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,8,balanced,0.30078399181365967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,8,balanced,0.8747946421305338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,8,power_law_1.01,0.3050368070602417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,8,power_law_1.01,0.17211519479751586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,8,balanced,0.3036959966023763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,8,balanced,0.3066506584485372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,8,power_law_1.01,0.380185604095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,8,power_law_1.01,0.20510718822479249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,8,balanced,0.31086399157842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,8,power_law_1.01,0.3562304019927979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,8,power_law_1.01,0.22378880977630616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,8,balanced,0.3144426743189494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,8,power_law_1.01,0.39276800155639646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,8,balanced,0.3253119985262553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,8,power_law_1.01,0.21653120517730712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,8,balanced,0.3293173313140869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,8,balanced,1.7041600545247395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,8,power_law_1.01,0.438259220123291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,8,power_law_1.01,0.24522879123687744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,8,balanced,1.116634686787923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,8,balanced,0.34030401706695557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,8,power_law_1.01,0.45438079833984374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,8,power_law_1.01,0.2428607940673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,8,balanced,0.36640000343322754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,8,power_law_1.01,0.46791682243347166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,8,power_law_1.01,0.24344959259033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,8,power_law_1.01,0.43089280128479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,8,power_law_1.01,0.2528320074081421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,8,power_law_1.01,0.4813248157501221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,8,power_law_1.01,0.2835903882980347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,8,power_law_1.01,0.47487359046936034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,8,power_law_1.01,0.27381119728088377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,8,power_law_1.01,0.5107967853546143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,8,power_law_1.01,0.29373440742492674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,8,balanced,0.3922826846440633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,8,power_law_1.01,0.3487488031387329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,8,power_law_1.01,0.5553855895996094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,8,balanced,1.5109705924987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,8,power_law_1.01,0.37178239822387693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,8,power_law_1.01,0.618617582321167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,8,balanced,2.257333278656006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,8,power_law_1.01,0.7042623996734619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,8,power_law_1.01,0.45311999320983887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,8,power_law_1.01,0.8077504158020019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,8,power_law_1.01,0.48339200019836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,8,power_law_1.01,0.9218048095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,8,power_law_1.01,0.625216007232666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,8,power_law_1.01,0.9226431846618652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,8,power_law_1.01,0.6738048076629639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,8,power_law_1.01,1.156383991241455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,8,balanced,0.44649600982666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,8,power_law_1.01,0.8717184066772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,8,power_law_1.01,1.597715187072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,8,power_law_1.01,1.111251163482666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,8,power_law_1.01,1.9542207717895508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,8,balanced,0.5010559956232706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,8,balanced,1.8650612831115723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,8,power_law_1.01,1.4881919860839843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,8,power_law_1.01,2.450259208679199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,8,power_law_1.01,1.7805952072143554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,8,balanced,0.5885706742604574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,8,power_law_1.01,2.8343807220458985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,8,power_law_1.01,2.1546560287475587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,8,power_law_1.01,4.563103866577149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,8,power_law_1.01,3.6076416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,8,balanced,0.7267253398895264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,8,power_law_1.01,8.667897796630859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,8,balanced,3.228245417277018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,8,power_law_1.01,6.741011047363282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,8,balanced,0.9019467035929362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,8,power_law_1.01,0.10016000270843506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,8,balanced,1.2900853157043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,8,power_law_1.01,0.1384384036064148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,8,power_law_1.01,0.2210752010345459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,8,balanced,2.8512001037597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,8,power_law_1.01,0.09268479943275451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,8,power_law_1.2,0.13210879564285277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,8,power_law_1.01,0.1314560055732727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,8,power_law_1.01,0.158297598361969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,8,power_law_1.2,0.20067839622497557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,8,balanced,1.6525440216064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,8,power_law_1.01,0.1861567974090576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,8,power_law_1.2,0.19067519903182983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,8,power_law_1.01,0.22284159660339356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,8,power_law_1.2,0.11996159553527833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,8,power_law_1.01,0.22958719730377197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,8,power_law_1.2,0.16922240257263182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,8,power_law_1.01,0.23074560165405272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,8,power_law_1.2,0.2545151948928833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,8,power_law_1.01,0.23966081142425538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,8,power_law_1.2,0.25922560691833496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,8,power_law_1.01,0.27670400142669677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,8,balanced,2.2781333923339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,8,power_law_1.2,0.38064000606536863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,8,power_law_1.01,0.28866560459136964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,8,power_law_1.2,0.38100481033325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,8,power_law_1.01,0.28698880672454835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,8,power_law_1.2,0.3742847919464111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,8,power_law_1.01,0.3122560024261475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,8,power_law_1.2,0.4128704071044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,8,power_law_1.01,0.3263040065765381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,8,power_law_1.2,0.44820480346679686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,8,power_law_1.01,0.36306560039520264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,8,balanced,5.969573338826497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,8,power_law_1.2,0.4381824016571045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,8,power_law_1.01,0.425216007232666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,8,power_law_1.2,0.47711358070373533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,8,balanced,2.890714645385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,8,power_law_1.2,0.500761604309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,8,power_law_1.01,0.4540736198425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,8,power_law_1.2,0.4916672229766846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,8,power_law_1.2,0.5198783874511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,8,power_law_1.01,0.5011072158813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,8,power_law_1.2,0.6031487941741943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,8,balanced,5.371573130289714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,8,power_law_1.01,0.6139840126037598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,8,power_law_1.2,0.6509632110595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,8,power_law_1.2,0.7702720165252686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,8,power_law_1.01,0.7981311798095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,8,power_law_1.2,0.8081664085388184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,8,power_law_1.01,0.9464127540588378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,8,power_law_1.2,1.0187968254089355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,8,power_law_1.01,1.2657983779907227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,8,power_law_1.2,0.9665920257568359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,8,power_law_1.01,1.6753599166870117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,8,power_law_1.2,1.2857024192810058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,8,balanced,4.430469195048015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,8,power_law_1.01,2.235366439819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,8,power_law_1.2,1.6572799682617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,8,power_law_1.2,2.157638359069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,8,power_law_1.01,3.154195213317871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,8,power_law_1.2,2.56112003326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,8,power_law_1.01,3.595654296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,8,power_law_1.2,3.1631807327270507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,8,power_law_1.2,0.08288000226020813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,8,power_law_1.01,5.783935928344727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,8,power_law_1.2,0.12215039730072022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,8,power_law_1.2,4.754374313354492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,8,power_law_1.2,0.10540159940719604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,8,power_law_1.01,12.188185882568359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,8,power_law_1.2,0.08373759984970093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,8,power_law_1.2,9.23971176147461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,8,power_law_1.2,0.11591039896011353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,8,power_law_1.2,0.14387840032577515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,8,power_law_1.2,0.17172479629516602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,8,power_law_1.2,0.20787200927734376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,8,power_law_1.2,0.21532158851623534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,8,power_law_1.2,0.22272639274597167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,8,power_law_1.2,0.2425856113433838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,8,power_law_1.2,0.24117119312286378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,8,power_law_1.2,0.25126399993896487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,8,power_law_1.2,0.2596927881240845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,8,balanced,8.641701380411783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,8,power_law_1.2,0.28095359802246095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,8,power_law_1.2,0.2861824035644531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,8,power_law_1.2,0.2893824100494385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,8,power_law_1.2,0.35325438976287843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,8,power_law_1.2,0.3818624019622803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,8,power_law_1.2,0.47731838226318357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,8,power_law_1.2,0.512179183959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,8,power_law_1.2,0.6445824146270752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,4,balanced,0.05955733358860016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,8,power_law_1.2,0.7143295764923095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,4,balanced,0.06679999828338623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,4,balanced,0.08267733454704285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,8,power_law_1.2,0.9902848243713379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,8,power_law_1.2,0.09559040069580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,4,balanced,0.12853333353996277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,8,power_law_1.2,1.218073558807373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,8,power_law_1.2,0.13791359663009645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,4,balanced,0.20288532972335815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,8,power_law_1.2,1.5850048065185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,4,balanced,0.37145598729451496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,8,power_law_1.2,0.11752959489822387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,4,balanced,0.532975991566976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,8,power_law_1.2,2.0457408905029295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,8,power_law_1.2,0.08919680118560791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,4,balanced,0.5410986741383871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,8,power_law_1.2,0.12198400497436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,8,power_law_1.2,2.7914623260498046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,4,balanced,0.5404853423436483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,8,power_law_1.2,0.1531775951385498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,4,balanced,0.5475093523661295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,8,power_law_1.2,4.394739151000977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,4,balanced,0.5416426658630371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,8,power_law_1.2,0.17331199645996093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,4,balanced,0.5434773365656534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,8,power_law_1.2,0.20307838916778564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,8,power_law_1.2,7.686297607421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,4,balanced,0.5446773370107015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,8,power_law_1.2,0.21772799491882325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,4,balanced,0.5530346632003784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,8,power_law_1.2,0.22140159606933593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,4,balanced,0.5624320109685262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,8,power_law_1.2,0.23311359882354737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,4,balanced,0.5682933330535889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,8,power_law_1.2,0.26299519538879396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,4,balanced,0.5757866700490316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,8,power_law_1.2,0.2765568017959595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,4,balanced,0.5936959981918335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,8,power_law_1.2,0.2992768049240112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,4,balanced,0.6186133225758871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,8,power_law_1.2,0.30560638904571535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,4,balanced,0.6567893425623575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,8,power_law_1.2,0.33673601150512694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,8,power_law_1.2,0.37353599071502686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,4,balanced,0.698474645614624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,8,power_law_1.2,0.46477441787719725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,4,balanced,0.763871987660726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,4,balanced,0.050053333242734276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,8,power_law_1.2,0.4889023780822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,4,balanced,0.0539626677831014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,4,balanced,0.8522240320841471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,4,balanced,0.06489600241184235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,4,balanced,0.09210667014122009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,8,power_law_1.2,0.5240320205688477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,4,balanced,0.13760000467300415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,8,power_law_1.2,0.6604608058929443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,4,balanced,0.21921066443125406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,4,balanced,0.9962773323059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,8,power_law_1.2,0.8902144432067871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,4,balanced,0.30270934104919434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,4,balanced,0.3053973317146301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,8,power_law_1.2,1.0182016372680665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,4,balanced,0.3046506643295288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,8,power_law_1.2,1.4096192359924316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,4,balanced,0.30871466795603436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,4,balanced,1.2533600330352783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,4,balanced,0.3089173237482707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,8,power_law_1.2,1.7445632934570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,4,balanced,0.3130720059076945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,8,power_law_1.2,2.785548782348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,4,balanced,0.31706132491429645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,4,balanced,0.32528533538182575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,8,power_law_1.2,3.793209457397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,4,balanced,0.3359733422597249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,8,power_law_1.2,4.402944183349609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,4,balanced,0.06734933455785115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,4,balanced,1.5301440556844075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,4,balanced,0.3392373323440552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,4,balanced,0.07331733405590057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,4,balanced,0.3507946729660034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,8,power_law_1.2,6.754783630371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,4,balanced,0.08281066517035167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,4,balanced,0.37646933396657306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,4,balanced,0.10817066828409831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,4,balanced,0.3954293330510457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,4,balanced,0.15481600165367126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,8,power_law_1.2,14.821369934082032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,4,balanced,0.23705067237218222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,4,balanced,0.43691198031107586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,4,balanced,0.3237920006116231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,4,balanced,0.3264426589012146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,4,balanced,2.0330665906270347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,4,balanced,0.48447998364766437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,4,balanced,0.3267786701520284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,4,power_law_1.01,0.0856768012046814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,4,power_law_1.01,0.06483839750289917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,4,balanced,0.3298719922701518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,4,power_law_1.01,0.12102400064468384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,4,balanced,0.5704319874445597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,4,power_law_1.01,0.08388479948043823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,4,balanced,0.33372267087300617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,4,power_law_1.01,0.20067839622497557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,4,balanced,0.33825600147247314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,4,power_law_1.01,0.12677760124206544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,4,power_law_1.01,0.12394239902496337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,4,balanced,0.6633973519007365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,4,balanced,0.34357865651448566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,4,power_law_1.01,0.08177919983863831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,4,power_law_1.01,0.16983040571212768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,4,balanced,0.35021865367889404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,4,power_law_1.01,0.12465920448303222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,4,power_law_1.01,0.24559359550476073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,4,balanced,0.3646293481190999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,4,power_law_1.01,0.16216959953308105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,4,balanced,0.8184266885121664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,4,balanced,2.6018880208333335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,4,power_law_1.01,0.27242240905761717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,4,balanced,0.3720533450444539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,4,power_law_1.01,0.1751360058784485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,4,power_law_1.01,0.3631808042526245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,4,balanced,0.387114683787028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,4,power_law_1.01,0.21342079639434813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,4,power_law_1.01,0.3886271953582764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,4,balanced,0.42341868082682294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,4,power_law_1.01,0.22622718811035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,4,power_law_1.01,0.4043903827667236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,4,balanced,1.0554133256276448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,4,power_law_1.01,0.22929279804229735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,4,power_law_1.01,0.4386240005493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,4,power_law_1.01,0.24530560970306398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,4,power_law_1.01,0.4548799991607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,4,power_law_1.01,0.2555455923080444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,4,power_law_1.01,0.08759679794311523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,4,power_law_1.01,0.4560704231262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,4,balanced,0.474234660466512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,4,power_law_1.01,0.27139840126037595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,4,power_law_1.01,0.4660352230072021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,4,power_law_1.01,0.10860799551010132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,4,power_law_1.01,0.2765952110290527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,4,power_law_1.01,0.15040639638900757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,4,balanced,1.395802656809489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,4,power_law_1.01,0.49716482162475584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,4,power_law_1.01,0.10518399477005005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,4,power_law_1.01,0.2947904109954834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,4,power_law_1.01,0.50797438621521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,4,power_law_1.01,0.13708159923553467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,4,power_law_1.01,0.29808640480041504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,4,power_law_1.01,0.5318079948425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,4,power_law_1.01,0.17282559871673583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,4,balanced,3.9186347325642905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,4,balanced,0.5927306811014811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,4,power_law_1.01,0.20137600898742675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,4,power_law_1.01,0.5893119812011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,4,power_law_1.01,0.3098047971725464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,4,power_law_1.01,0.23554561138153077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,4,power_law_1.01,0.3569024085998535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,4,power_law_1.01,0.6054143905639648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,4,power_law_1.01,0.24456961154937745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,4,balanced,0.6740852991739908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,4,power_law_1.01,0.26340479850769044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,4,power_law_1.01,0.7349503993988037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,4,power_law_1.01,0.3939519882202148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,4,balanced,1.835840066274007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,4,power_law_1.01,0.2744960069656372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,4,balanced,0.8051253159840902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,4,power_law_1.01,0.7400191783905029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,4,power_law_1.01,0.48728318214416505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,4,power_law_1.01,0.28225278854370117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,4,power_law_1.01,0.9617983818054199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,4,power_law_1.01,0.28928000926971437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,4,power_law_1.01,0.5260032176971435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,4,power_law_1.01,0.31734399795532225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,4,power_law_1.01,0.9659328460693359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,4,balanced,1.015328009923299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,4,power_law_1.01,0.6659135818481445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,4,power_law_1.01,0.34442241191864015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,4,power_law_1.01,1.1755200386047364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,4,power_law_1.01,0.36148478984832766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,4,power_law_1.01,0.7677375793457031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,4,power_law_1.01,0.3981760025024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,4,power_law_1.01,1.500499153137207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,4,power_law_1.01,1.0186688423156738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,4,power_law_1.01,0.4767295837402344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,4,balanced,1.2889706293741863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,4,power_law_1.01,2.059129524230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,4,power_law_1.01,1.187820816040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,4,balanced,2.3187146186828613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,4,power_law_1.01,2.480300712585449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,4,power_law_1.01,1.6593727111816405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,4,power_law_1.01,0.5475071907043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,4,power_law_1.01,3.1902591705322267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,4,power_law_1.01,2.1005952835083006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,4,power_law_1.2,0.08573439717292786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,4,balanced,1.820053259531657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,4,power_law_1.01,0.6346240043640137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,4,power_law_1.01,2.543270492553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,4,power_law_1.01,4.7302593231201175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,4,power_law_1.2,0.12120319604873657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,4,power_law_1.01,0.7534336090087891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,4,power_law_1.2,0.12313599586486816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,4,power_law_1.01,4.0271553039550785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,4,power_law_1.01,0.9905599594116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,4,power_law_1.01,8.568505859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,4,power_law_1.2,0.12643840312957763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,4,power_law_1.01,1.142956829071045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,4,power_law_1.01,7.6290946960449215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,4,power_law_1.01,1.606015968322754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,4,power_law_1.2,0.1600000023841858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,4,balanced,2.4076266288757324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,4,power_law_1.01,2.192736053466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,4,power_law_1.2,0.2205120086669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,4,power_law_1.01,2.9742656707763673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,4,power_law_1.2,0.25474560260772705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,4,power_law_1.01,3.8129920959472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,4,power_law_1.2,0.3670783996582031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,4,power_law_1.01,5.06363525390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,4,power_law_1.2,0.3671231985092163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,4,balanced,3.5244534810384116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,4,power_law_1.01,7.583929443359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,4,power_law_1.2,0.37763841152191163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,4,balanced,7.275199890136719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,4,power_law_1.2,0.41505918502807615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,4,balanced,3.298709233601888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,4,power_law_1.01,15.194406127929687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,4,power_law_1.2,0.44099841117858884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,4,power_law_1.2,0.4490623950958252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,4,power_law_1.2,0.47380480766296384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,4,power_law_1.2,0.4707520008087158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,4,power_law_1.2,0.5059199810028077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,4,power_law_1.2,0.5360767841339111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,4,balanced,4.161946614583333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,4,power_law_1.2,0.6082880020141601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,4,power_law_1.2,0.6666751861572265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,4,power_law_1.2,0.7240640163421631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,4,power_law_1.2,0.8116543769836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,4,power_law_1.2,0.9523008346557618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,4,power_law_1.2,0.9694720268249511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,4,power_law_1.2,1.22992000579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,4,power_law_1.2,1.567628765106201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,4,power_law_1.2,2.2354496002197264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,4,balanced,6.487738927205403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,4,power_law_1.2,2.8175167083740233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,4,balanced,6.6231733957926435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,4,power_law_1.2,3.551443099975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,4,power_law_1.2,0.06516479849815368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,4,power_law_1.2,0.08373759984970093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,4,power_law_1.2,5.0732990264892575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,4,power_law_1.2,0.09002879858016968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,4,power_law_1.2,0.0926144003868103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,4,power_law_1.2,9.860243225097657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,4,power_law_1.2,0.11916799545288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,4,power_law_1.2,0.1456063985824585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,4,power_law_1.2,0.1651136040687561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,4,power_law_1.2,0.20755839347839355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,4,power_law_1.2,0.22189440727233886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,4,power_law_1.2,0.22327680587768556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,4,power_law_1.2,0.23688321113586425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,4,power_law_1.2,0.2537087917327881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,4,power_law_1.2,0.26075520515441897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,4,power_law_1.2,0.2777087926864624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,4,power_law_1.2,0.2932096004486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,4,power_law_1.2,0.3073024034500122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,4,power_law_1.2,0.3254463911056519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,4,power_law_1.2,0.37275519371032717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,4,balanced,12.758810679117838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,4,power_law_1.2,0.39800961017608644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,4,power_law_1.2,0.4794816017150879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,4,power_law_1.2,0.5538432121276855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,4,power_law_1.2,0.6932479858398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,4,power_law_1.2,0.7917695999145508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,4,power_law_1.2,1.0765376091003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,4,power_law_1.2,1.322822380065918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,4,power_law_1.2,1.8266752243041993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,4,power_law_1.2,2.159974479675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,4,power_law_1.2,2.7931840896606444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,4,power_law_1.2,4.119577789306641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,4,power_law_1.2,8.469145965576171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,2,balanced,0.06190933287143707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,2,balanced,0.06997333467006683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,2,balanced,0.08667199810345967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,4,power_law_1.2,0.08796799778938294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,2,balanced,0.13499200344085693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,4,power_law_1.2,0.10810240507125854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,2,balanced,0.22334933280944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,4,power_law_1.2,0.1114240050315857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,2,balanced,0.3834826548894246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,4,power_law_1.2,0.09687680006027222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,2,balanced,0.5519573291142782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,2,balanced,0.053717335065205894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,2,balanced,0.55731733640035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,4,power_law_1.2,0.13242239952087403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,2,balanced,0.5543466806411743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,2,balanced,0.05761066575845083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,4,power_law_1.2,0.16248960494995118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,2,balanced,0.06902400155862172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,2,balanced,0.557375987370809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,4,power_law_1.2,0.17793279886245728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,2,balanced,0.09886399904886882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,2,balanced,0.5604480107625326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,4,power_law_1.2,0.22581119537353517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,2,balanced,0.14761599898338318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,2,balanced,0.5656799872716268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,2,balanced,0.24761066834131876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,4,power_law_1.2,0.23882880210876464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,2,balanced,0.5669973293940226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,2,balanced,0.3439626693725586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,4,power_law_1.2,0.2514688014984131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,2,balanced,0.5762826601664225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,2,balanced,0.09777599573135376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,2,balanced,0.3473386764526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,4,power_law_1.2,0.267795205116272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,2,balanced,0.589792013168335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,2,balanced,0.35101866722106934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,2,balanced,0.10591999689737956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,4,power_law_1.2,0.2744704008102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,2,balanced,0.5961759885152181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,2,balanced,0.3540053367614746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,2,balanced,0.11352533102035522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,4,power_law_1.2,0.2968640089035034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,2,balanced,0.3585760196050008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,2,balanced,0.6034026543299357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,2,balanced,0.13941867152849832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,2,balanced,0.3702186743418376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,4,power_law_1.2,0.3219583988189697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,2,balanced,0.18628267447153726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,2,balanced,0.6288906733194987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,2,balanced,0.3729706605275472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,4,power_law_1.2,0.35383679866790774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,2,balanced,0.28888533512751263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,2,balanced,0.38442667325337726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,2,balanced,0.6836640040079752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,4,power_law_1.2,0.3633471965789795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,2,balanced,0.3887840112050374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,2,balanced,0.396778662999471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,2,balanced,0.39289601643880206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,4,power_law_1.2,0.4185344219207764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,2,balanced,0.7363466421763102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,2,balanced,0.40668265024820965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,2,balanced,0.3973653316497803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,4,power_law_1.2,0.49266557693481444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,2,balanced,0.4034239848454793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,2,balanced,0.8004799683888754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,2,balanced,0.4240320126215617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,2,balanced,0.4100106557210286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,2,balanced,0.45216532548268634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,2,balanced,0.42021334171295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,4,power_law_1.2,0.5678080081939697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,2,balanced,0.9206720193227133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,2,balanced,0.4764480193456014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,2,balanced,0.4264959891637166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,2,balanced,0.44017601013183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,2,balanced,0.5409653186798096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,4,power_law_1.2,0.6531904220581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,2,balanced,1.0550506909688313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,2,balanced,0.45739734172821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,4,power_law_1.2,0.7718912124633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,2,balanced,0.6172426541646322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,2,balanced,0.4694133202234904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,4,power_law_1.2,1.0520832061767578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,2,balanced,0.5096960067749023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,2,balanced,1.286847988764445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,2,balanced,0.7165493170420328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,2,balanced,0.5817919969558716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,4,power_law_1.2,1.264025592803955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,4,power_law_1.2,1.6244287490844727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,2,balanced,0.8497280279795328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,4,power_law_1.2,2.2716415405273436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,2,power_law_1.01,0.06727679967880248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,2,balanced,1.6429866154988606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,4,power_law_1.2,3.093657684326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,2,balanced,0.6772586504618326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,2,power_law_1.01,0.08331519961357117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,2,balanced,1.10426131884257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,4,power_law_1.2,4.146438217163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,2,power_law_1.01,0.12562559843063353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,4,power_law_1.2,5.723020935058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,2,power_law_1.01,0.10957440137863159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,2,power_law_1.01,0.055430400371551516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,2,power_law_1.01,0.17520639896392823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,2,balanced,2.135050614674886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,4,power_law_1.2,8.64552993774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,2,power_law_1.01,0.24579839706420897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,2,power_law_1.01,0.06656640172004699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,2,balanced,1.4408213297526042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,2,balanced,0.8810933430989584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,2,power_law_1.01,0.29818239212036135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,2,power_law_1.01,0.09164800047874451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,2,balanced,1.024997313817342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,2,power_law_1.01,0.36789760589599607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,2,power_law_1.01,0.08105599880218506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,4,power_law_1.2,17.618540954589843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,2,power_law_1.01,0.12459520101547242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,2,power_law_1.01,0.3802623987197876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,2,balanced,1.2317919731140137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,2,power_law_1.01,0.16879359483718873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,2,power_law_1.01,0.4113471984863281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,2,balanced,1.985498587290446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,2,power_law_1.01,0.1813055992126465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,2,power_law_1.01,0.4337791919708252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,2,balanced,2.800959904988607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,2,balanced,1.633776028951009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,2,power_law_1.01,0.23444480895996095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,2,power_law_1.01,0.465715217590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,2,power_law_1.01,0.24567039012908937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,2,power_law_1.01,0.4826176166534424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,2,power_law_1.01,0.2557440042495728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,2,power_law_1.01,0.4972799777984619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,2,balanced,2.117695967356364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,2,power_law_1.01,0.27956480979919435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,2,power_law_1.01,0.5408639907836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,2,power_law_1.01,0.2800256013870239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,2,power_law_1.01,0.5548416137695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,2,balanced,2.546010653177897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,2,power_law_1.01,0.2930111885070801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,2,power_law_1.01,0.5598144054412841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,2,balanced,3.035914738972982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,2,power_law_1.01,0.32741758823394773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,2,balanced,3.4919252395629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,2,power_law_1.01,0.6084352016448975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,2,power_law_1.01,0.3455424070358276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,2,power_law_1.01,0.6508927822113038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,2,power_law_1.01,0.09806720018386841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,2,power_law_1.01,0.36833279132843016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,2,power_law_1.01,0.7982143878936767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,2,power_law_1.01,0.11146880388259887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,2,power_law_1.01,0.371724796295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,2,power_law_1.01,0.8684672355651856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,2,power_law_1.01,0.13898240327835082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,2,power_law_1.01,0.4210559844970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,2,power_law_1.01,1.0423295974731446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,2,balanced,4.101903915405273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,2,power_law_1.01,0.1313024044036865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,2,power_law_1.01,0.4853184223175049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,2,balanced,3.1930452982584634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,2,power_law_1.01,1.163590431213379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,2,power_law_1.01,0.16904319524765016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,2,power_law_1.01,0.6094336032867431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,2,power_law_1.01,0.20785920619964598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,2,power_law_1.01,1.428268814086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,2,power_law_1.01,0.6165056228637695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,2,power_law_1.01,0.23255679607391358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,2,power_law_1.01,0.7640960216522217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,2,power_law_1.01,2.0070592880249025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,2,power_law_1.01,0.28022398948669436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,2,power_law_1.01,0.9073663711547851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,2,power_law_1.01,2.742585563659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,2,power_law_1.01,0.2926271915435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,2,power_law_1.2,0.06730239987373351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,2,power_law_1.01,1.1657407760620118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,2,balanced,5.292997360229492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,2,balanced,5.566127777099609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,2,power_law_1.01,0.3096127986907959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,2,power_law_1.01,2.9767488479614257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,2,power_law_1.2,0.08314239978790283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,2,power_law_1.01,1.6591615676879883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,2,power_law_1.01,0.3271424055099487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,2,power_law_1.2,0.0932096004486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,2,power_law_1.01,3.5934207916259764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,2,power_law_1.01,2.278060722351074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,2,power_law_1.2,0.11362559795379638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,2,power_law_1.01,0.3501375913619995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,2,power_law_1.2,0.1656448006629944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,2,power_law_1.01,2.7226112365722654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,2,power_law_1.01,0.36601600646972654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,2,power_law_1.01,5.654073715209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,2,power_law_1.2,0.22181758880615235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,2,power_law_1.2,0.26131200790405273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,2,power_law_1.01,0.4049407958984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,2,power_law_1.01,3.251660919189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,2,power_law_1.2,0.34339840412139894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,2,power_law_1.01,0.431001615524292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,2,power_law_1.01,10.970291137695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,2,power_law_1.2,0.3764031887054443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,2,power_law_1.01,5.135475158691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,2,balanced,4.956410725911458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,2,power_law_1.01,0.46752638816833497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,2,power_law_1.2,0.3771967887878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,2,power_law_1.2,0.4036287784576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,2,power_law_1.01,0.5366591930389404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,2,balanced,6.874613444010417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,2,power_law_1.01,10.174598693847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,2,power_law_1.2,0.43006081581115724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,2,power_law_1.01,0.6796800136566162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,2,power_law_1.2,0.47867522239685056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,2,power_law_1.2,0.49891200065612795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,2,power_law_1.2,0.5237311840057373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,2,power_law_1.2,0.5751039981842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,2,power_law_1.01,0.7707200050354004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,2,power_law_1.2,0.5503104209899903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,2,power_law_1.2,0.629695987701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,2,power_law_1.2,0.6999872207641602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,2,power_law_1.01,0.8931520462036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,2,power_law_1.2,0.8272831916809082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,2,power_law_1.2,0.8788352012634277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,2,power_law_1.01,1.0692416191101075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,2,power_law_1.2,1.1060735702514648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,2,power_law_1.01,1.4029952049255372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,2,power_law_1.2,1.2001664161682128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,2,power_law_1.01,1.7412799835205077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,2,power_law_1.2,1.5108991622924806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,2,power_law_1.2,2.2373056411743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,2,power_law_1.01,2.455027198791504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,2,power_law_1.2,2.810304069519043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,2,balanced,10.769418080647787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,2,power_law_1.01,3.0835391998291017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,2,power_law_1.2,3.0969152450561523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,2,power_law_1.01,4.572415924072265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,2,balanced,9.78988774617513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,2,power_law_1.2,3.9857086181640624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,2,power_law_1.01,5.971225738525391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,2,power_law_1.2,5.702924728393555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,2,power_law_1.01,7.747955322265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,2,power_law_1.2,12.206034851074218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,2,power_law_1.01,11.157785797119141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,2,balanced,9.309200286865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,2,power_law_1.01,22.499591064453124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,2,balanced,21.170565287272137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,2,power_law_1.2,0.055219197273254396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,2,power_law_1.2,0.06665599942207337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,2,power_law_1.2,0.07416960000991821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,2,power_law_1.2,0.08729599714279175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,2,power_law_1.2,0.11213439702987671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,2,power_law_1.2,0.15088000297546386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,2,power_law_1.2,0.1708351969718933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,2,power_law_1.2,0.22977919578552247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,2,power_law_1.2,0.24689919948577882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,2,power_law_1.2,0.24519040584564208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,2,power_law_1.2,0.26590719223022463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,2,power_law_1.2,0.27923200130462644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,2,power_law_1.2,0.294815993309021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,2,power_law_1.2,0.3118016004562378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,2,power_law_1.2,0.3555392026901245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,2,power_law_1.2,0.36888320446014405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,2,power_law_1.2,0.37401599884033204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,2,power_law_1.2,0.438259220123291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,2,power_law_1.2,0.4889472007751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,2,power_law_1.2,0.609548807144165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,2,power_law_1.2,0.6588352203369141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,2,power_law_1.2,0.8287424087524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,2,power_law_1.2,0.9534720420837403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,2,power_law_1.2,1.2355520248413085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,2,power_law_1.2,1.7892864227294922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,2,power_law_1.2,2.418809509277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,2,power_law_1.2,2.722547149658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,2,power_law_1.2,3.4187648773193358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,2,power_law_1.2,5.498246383666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,1,balanced,0.06857066849867503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,1,balanced,0.07667733232180278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,2,power_law_1.2,0.09816960096359253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,2,power_law_1.2,10.980083465576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,1,balanced,0.09759466846783955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,1,balanced,0.1504693329334259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,2,power_law_1.2,0.11099519729614257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,1,balanced,0.24668800830841064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,2,power_law_1.2,0.11605119705200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,1,balanced,0.43565332889556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,1,balanced,0.617738684018453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,2,power_law_1.2,0.12687360048294066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,1,balanced,0.6233919858932495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,2,power_law_1.2,0.1565888047218323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,1,balanced,0.6307413180669149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,1,balanced,0.6295093297958374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,2,power_law_1.2,0.1931391954421997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,1,balanced,0.6268479824066162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,2,power_law_1.2,0.2189120054244995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,1,balanced,0.6343146562576294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,2,power_law_1.2,0.2775167942047119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,1,balanced,0.6398026545842489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,1,balanced,0.0610453337430954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,1,balanced,0.6493759950002035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,2,power_law_1.2,0.29344639778137205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,1,balanced,0.06612266600131989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,1,balanced,0.6603946685791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,2,power_law_1.2,0.2998464107513428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,1,balanced,0.08185600241025288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,1,balanced,0.6652906735738119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,1,balanced,0.11999467015266418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,2,power_law_1.2,0.3283711910247803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,1,balanced,0.684175968170166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,1,balanced,0.18684800465901694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,2,power_law_1.2,0.3481152057647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,1,balanced,0.736191987991333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,1,balanced,0.3153866728146871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,2,power_law_1.2,0.36233599185943605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,1,balanced,0.44225064913431805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,1,balanced,0.7907306353251139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,1,balanced,0.4459466536839803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,2,power_law_1.2,0.40241279602050783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,1,balanced,0.8864906628926595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,1,balanced,0.45024001598358154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,2,power_law_1.2,0.4401343822479248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,1,balanced,0.4562346537907918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,2,power_law_1.2,0.47475199699401854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,1,balanced,1.032474676767985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,1,balanced,0.45943466822306317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,2,power_law_1.2,0.5522047996520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,1,power_law_1.01,0.05533440113067627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,1,balanced,0.4672000010808309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,1,power_law_1.01,0.061791998147964475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,1,balanced,1.2121866544087727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,2,power_law_1.2,0.6700352191925049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,1,power_law_1.01,0.06085759997367859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,1,balanced,0.47419734795888263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,1,power_law_1.01,0.070278400182724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,1,balanced,0.489738663037618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,1,power_law_1.01,0.07742080092430115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,1,balanced,1.4401973088582356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,1,power_law_1.01,0.093094402551651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,1,balanced,0.5020480155944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,1,power_law_1.01,0.09553920030593872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,2,power_law_1.2,0.7757887840270996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,1,power_law_1.01,0.12177920341491699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,1,balanced,0.1597866714000702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,1,balanced,0.5182773272196451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,1,power_law_1.01,0.1460543990135193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,1,power_law_1.01,0.18765439987182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,1,balanced,0.17070400714874268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,1,balanced,0.5470026731491089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,1,power_law_1.01,0.20322558879852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,1,balanced,1.859674612681071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,2,power_law_1.2,0.9264063835144043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,1,power_law_1.01,0.2793407917022705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,1,balanced,0.18444265921910605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,1,power_law_1.01,0.22843520641326903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,1,balanced,0.5947786569595337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,1,balanced,0.2108479936917623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,2,power_law_1.2,1.129753589630127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,1,power_law_1.01,0.3214783906936646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,1,power_law_1.01,0.2966655969619751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,1,balanced,0.6423999865849813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,1,balanced,0.2770400047302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,2,power_law_1.2,1.4999936103820801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,1,power_law_1.01,0.30497279167175295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,1,power_law_1.01,0.4061759948730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,1,balanced,0.4009600083033244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,1,balanced,2.463792006174723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,1,balanced,0.7459839979807535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,1,power_law_1.01,0.32118399143218995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,1,power_law_1.01,0.436352014541626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,2,power_law_1.2,1.8489215850830079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,1,balanced,0.5371679862340292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,1,balanced,0.5448480049769083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,1,power_law_1.01,0.34266879558563235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,1,power_law_1.01,0.4541632175445557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,1,balanced,0.862938642501831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,2,power_law_1.2,2.491904067993164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,1,balanced,0.5589866638183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,1,power_law_1.01,0.3625216007232666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,1,power_law_1.01,0.4615424156188965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,2,power_law_1.2,3.3173633575439454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,1,balanced,0.5637919902801514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,1,power_law_1.01,0.3831808090209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,1,balanced,1.0177653630574544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,1,power_law_1.01,0.5166336059570312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,1,balanced,0.5814293225606283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,2,power_law_1.2,4.453542327880859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,1,power_law_1.01,0.4136256217956543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,1,balanced,3.4039360682169595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,1,power_law_1.01,0.5307007789611816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,1,balanced,0.5930613279342651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,1,power_law_1.01,0.4471424102783203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,1,balanced,1.2474346955617268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,1,balanced,0.6084426641464233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,1,power_law_1.01,0.5386623859405517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,2,power_law_1.2,5.810969543457031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,1,power_law_1.01,0.4726463794708252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,1,balanced,0.6355040073394775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,1,power_law_1.01,0.5651072025299072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,1,power_law_1.01,0.4814911842346191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,2,power_law_1.2,7.663871765136719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,1,balanced,0.6853600343068441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,1,power_law_1.01,0.585203218460083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,1,power_law_1.01,0.13950719833374023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,1,power_law_1.01,0.5740992069244385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,1,balanced,0.7087732950846354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,1,balanced,1.7089385986328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,1,power_law_1.01,0.6207168102264404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,2,power_law_1.2,12.291584014892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,1,balanced,0.7829973697662354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,1,power_law_1.01,0.6468992233276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,1,power_law_1.01,0.14531199932098388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,1,power_law_1.01,0.7110400199890137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,1,power_law_1.01,0.16374399662017822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,1,power_law_1.01,0.8021696090698243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,1,balanced,0.8952319622039795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,1,balanced,4.237978617350261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,1,power_law_1.01,0.19419519901275634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,1,power_law_1.01,0.793555212020874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,1,power_law_1.01,0.863526439666748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,1,power_law_1.01,0.2424191951751709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,2,power_law_1.2,24.226669311523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,1,balanced,2.262730598449707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,1,power_law_1.01,0.9780799865722656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,1,power_law_1.01,0.29553918838500975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,1,power_law_1.01,1.0806015968322753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,1,power_law_1.01,0.3343744039535522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,1,power_law_1.01,1.0979519844055177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,1,power_law_1.01,1.3036160469055176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,1,power_law_1.01,0.3958080053329468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,1,balanced,1.0813439687093098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,1,power_law_1.01,1.390668773651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,1,power_law_1.01,0.4260223865509033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,1,power_law_1.01,1.7648960113525392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,1,power_law_1.01,0.4330304145812988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,1,power_law_1.01,1.5881152153015137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,1,power_law_1.01,2.1782400131225588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,1,power_law_1.01,0.4584767818450928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,1,power_law_1.01,0.4908607959747314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,1,balanced,3.1959091822306314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,1,power_law_1.01,2.122336006164551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,1,power_law_1.01,3.101638412475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,1,power_law_1.01,0.5169983863830566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,1,balanced,5.303690592447917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,1,power_law_1.01,2.6220544815063476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,1,power_law_1.01,0.5689280033111572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,1,power_law_1.01,3.959212875366211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,1,balanced,1.4395519892374675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,1,power_law_1.01,0.6305280208587647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,1,power_law_1.01,3.656108856201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,1,power_law_1.01,4.830956649780274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,1,power_law_1.01,0.681663990020752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,1,balanced,1.706160068511963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,1,power_law_1.01,0.787014389038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,1,power_law_1.01,4.255545425415039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,1,power_law_1.01,7.459782409667969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,1,power_law_1.01,0.9987392425537109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,1,balanced,2.0876800219217935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,1,power_law_1.01,5.190259170532227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,1,balanced,3.96175479888916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,1,power_law_1.01,16.077229309082032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.01,1.1499008178710937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,1,power_law_1.01,8.128192138671874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,1,balanced,2.8293066024780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,1,power_law_1.01,16.72150421142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.01,1.4057727813720704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.01,1.7146623611450196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,1,balanced,3.7062454223632812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.01,2.3181119918823243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.01,2.8946943283081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,1,balanced,8.061813354492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.01,4.042591857910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,1,balanced,4.970831871032715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.01,5.192870330810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,1,balanced,5.303605397542317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.01,7.494022369384766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.01,9.809433746337891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,1,power_law_1.01,12.080646514892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,1,balanced,7.218261082967122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,1,power_law_1.2,0.07123839855194092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,1,power_law_1.01,19.0085693359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,1,power_law_1.2,0.07111039757728577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,1,power_law_1.2,0.08271359801292419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,1,power_law_1.2,0.12099839448928833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,1,power_law_1.01,37.431488037109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,1,power_law_1.2,0.16885759830474853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,1,balanced,7.624565124511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,1,power_law_1.2,0.248473596572876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,1,power_law_1.2,0.2924864053726196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,1,balanced,9.8918825785319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,1,power_law_1.2,0.3935744047164917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,1,power_law_1.2,0.4109312057495117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,1,power_law_1.2,0.4252607822418213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,1,power_law_1.2,0.44627838134765624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,1,power_law_1.2,0.495692777633667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,1,power_law_1.2,0.5129151821136475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,1,balanced,15.424490610758463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,1,balanced,12.335104624430338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,1,power_law_1.2,0.5395904064178467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,1,power_law_1.2,0.5552768230438232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,1,power_law_1.2,0.5806591987609864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,1,power_law_1.2,0.6235904216766357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,1,power_law_1.2,0.7376512050628662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,1,power_law_1.2,0.7898496150970459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,1,power_law_1.2,0.9955648422241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,1,power_law_1.2,1.1480768203735352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,1,power_law_1.2,1.4403072357177735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,1,power_law_1.2,1.6434879302978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,1,balanced,19.30716323852539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,1,balanced,14.809616088867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,1,power_law_1.2,2.1414911270141603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,1,power_law_1.2,2.7516864776611327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,1,power_law_1.2,3.7815807342529295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,1,power_law_1.2,4.3417919158935545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,1,power_law_1.2,5.211609649658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,1,power_law_1.2,8.165497589111329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,1,power_law_1.2,16.941542053222655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,1,power_law_1.2,0.05541120171546936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,1,power_law_1.2,0.06060799956321716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,1,power_law_1.2,0.07007359862327575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,1,power_law_1.2,0.09639040231704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,1,power_law_1.2,0.1371840000152588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,1,power_law_1.2,0.18402559757232667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,1,power_law_1.2,0.21016321182250977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,1,power_law_1.2,0.28016641139984133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,1,power_law_1.2,0.2980736017227173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,1,power_law_1.2,0.3105792045593262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,16,balanced,0.0582239975531896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,1,power_law_1.2,0.3410815954208374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,1,power_law_1.2,0.3605247974395752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,16,balanced,0.0639466643333435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,1,power_law_1.2,0.3728255987167358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,16,balanced,0.06279466549555461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,1,power_law_1.2,0.4103360176086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,16,balanced,0.055306668082873024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,1,power_law_1.2,0.4339712142944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,1,balanced,37.90448506673177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,16,balanced,0.0584746648867925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,1,power_law_1.2,0.47092480659484864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,1,power_law_1.2,0.4911231994628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,16,balanced,0.08215466638406117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,1,power_law_1.2,0.5784063816070557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,16,balanced,0.08385066191355388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,1,power_law_1.2,0.6700928211212158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,16,balanced,0.08352532982826233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,1,power_law_1.2,0.13952640295028687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,1,power_law_1.2,0.8110719680786133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,16,balanced,0.10989866654078166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,1,power_law_1.2,0.9106176376342774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,1,power_law_1.2,0.14581120014190674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,16,balanced,0.11064533392588298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,1,power_law_1.2,1.127359962463379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,1,power_law_1.2,0.17210240364074708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,16,balanced,0.10949866970380147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,1,power_law_1.2,1.3743167877197267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,16,balanced,0.1856266657511393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,1,power_law_1.2,0.1945024013519287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,1,power_law_1.2,1.8235328674316407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,16,balanced,0.18289599816004434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,1,power_law_1.2,0.23402879238128663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,1,power_law_1.2,2.2678207397460937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,16,balanced,0.1824480096499125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,1,power_law_1.2,3.1956863403320312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,1,power_law_1.2,0.27076480388641355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,16,power_law_1.01,0.10204160213470459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,16,balanced,0.18110400438308716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,1,power_law_1.2,0.30838398933410643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,1,power_law_1.2,3.985203170776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,16,power_law_1.01,0.12596479654312134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,16,balanced,0.1825760006904602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,1,power_law_1.2,0.38236799240112307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,1,power_law_1.2,4.852032089233399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,16,power_law_1.01,0.0735360026359558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,16,balanced,0.18307199080785116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,1,power_law_1.2,0.40761599540710447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,16,power_law_1.01,0.06202239990234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,16,balanced,0.18620266517003378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,1,power_law_1.2,7.459232330322266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,1,power_law_1.2,0.42383999824523927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,16,power_law_1.01,0.06837760210037232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,16,balanced,0.18826667467753092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,16,power_law_1.01,0.08044160008430482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,1,power_law_1.2,0.4509439945220947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,16,balanced,0.19698667526245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,1,power_law_1.2,16.329318237304687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,16,power_law_1.01,0.08035839796066284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,1,power_law_1.2,0.47932162284851076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,16,balanced,0.20618132750193277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,16,power_law_1.01,0.08116480112075805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,1,power_law_1.2,0.5110015869140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,16,balanced,0.22696000337600708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,16,power_law_1.01,0.10973440408706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,1,power_law_1.2,0.5696447849273681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,16,power_law_1.01,0.10568959712982177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,16,balanced,0.24563199281692505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,1,power_law_1.2,0.6315584182739258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,16,power_law_1.01,0.10223360061645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,1,power_law_1.2,0.6910975933074951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,16,power_law_1.2,0.1022528052330017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,16,power_law_1.01,0.1879744052886963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,16,balanced,0.3984533150990804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,1,power_law_1.2,0.7948863983154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,16,power_law_1.2,0.11958400011062623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,16,power_law_1.01,0.18240640163421631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,16,power_law_1.2,0.07738879919052125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,1,power_law_1.2,1.0076671600341798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,16,power_law_1.01,0.18096640110015869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,16,balanced,0.44167999426523846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,16,power_law_1.2,0.06092159748077393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,16,power_law_1.01,0.18365440368652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,16,power_law_1.2,0.0649728000164032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,16,power_law_1.01,0.18481279611587526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.2,1.162559986114502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,16,power_law_1.2,0.07463039755821228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,16,power_law_1.01,0.1825600028038025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,16,balanced,0.6461013158162435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,16,power_law_1.2,0.07941759824752807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,16,power_law_1.01,0.19809279441833497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,16,power_law_1.2,0.0823743999004364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.2,1.429529571533203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,16,power_law_1.01,0.21027839183807373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,16,power_law_1.2,0.10840320587158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.2,1.7376575469970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,16,power_law_1.01,0.2600895881652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,16,power_law_1.2,0.10896639823913574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,16,balanced,0.8496853510538737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.2,2.336447906494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,16,power_law_1.01,0.33070080280303954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,16,power_law_1.2,0.10687999725341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,16,power_law_1.01,0.3759488105773926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,16,power_law_1.2,0.1846783995628357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.2,2.956518363952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,16,power_law_1.2,0.17624959945678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,16,power_law_1.01,0.44550399780273436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.2,4.085996627807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,16,power_law_1.2,0.1843840003013611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,16,power_law_1.01,0.6375167846679688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,8,balanced,0.048063998421033226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,16,balanced,1.0518399874369304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,16,power_law_1.2,0.19055999517440797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.2,5.229817581176758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,16,power_law_1.01,0.9116864204406738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,8,balanced,0.04952000081539154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,16,power_law_1.2,0.18838399648666382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,16,power_law_1.01,1.2524864196777343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,8,balanced,0.05204799771308899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.2,7.532511901855469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,8,balanced,0.061664000153541565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,16,power_law_1.2,0.2042304039001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,16,power_law_1.01,1.6639360427856444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,8,balanced,0.0699893335501353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.2,9.826541137695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,16,power_law_1.2,0.21356160640716554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,16,power_law_1.01,1.9996864318847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,8,balanced,0.08342933654785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,16,power_law_1.2,0.2397696018218994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,8,balanced,0.08423999945322673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,16,power_law_1.01,3.2960575103759764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,1,power_law_1.2,12.116300964355469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,8,power_law_1.01,0.07043200135231018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,16,balanced,1.6632906595865886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,16,power_law_1.2,0.28279039859771726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,8,balanced,0.0839359958966573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,16,power_law_1.01,6.056339263916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,8,balanced,0.07858133316040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,8,power_law_1.01,0.08897280097007751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,16,power_law_1.2,0.31818881034851076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,1,power_law_1.2,19.008428955078124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,8,balanced,0.07906133433183034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,8,power_law_1.01,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,16,power_law_1.2,0.4301248073577881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,8,balanced,0.07959466675917308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,8,power_law_1.01,0.06627839803695679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,16,power_law_1.2,0.6144256114959716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,8,balanced,0.11161067088445027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,8,power_law_1.01,0.06812800168991089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,8,balanced,0.10827733079592387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,16,power_law_1.2,0.8628800392150879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,1,power_law_1.2,37.38870544433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,8,power_law_1.01,0.07487360239028931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,8,balanced,0.10602133472760518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,16,power_law_1.2,0.9819135665893555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,8,power_law_1.01,0.08131840229034423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,8,balanced,0.17178666591644287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,16,power_law_1.2,1.6321023941040038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,8,power_law_1.01,0.08197759985923767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,8,balanced,0.17164800564448038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,16,power_law_1.2,1.8400255203247071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,8,balanced,0.17294933398564658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,8,power_law_1.01,0.07763839960098266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,8,power_law_1.01,0.07724159955978394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,8,balanced,0.1763146718343099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,16,power_law_1.2,2.69803524017334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,8,power_law_1.01,0.07678080201148987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,8,balanced,0.17883733908335367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,16,power_law_1.2,4.345574569702149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,16,balanced,3.290890693664551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,8,power_law_1.01,0.10623999834060668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,8,balanced,0.1879253387451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,8,power_law_1.01,0.10563839673995971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,8,balanced,0.19693867365519205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,16,power_law_1.2,10.22974090576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,8,power_law_1.01,0.10663679838180543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,8,balanced,0.2183306614557902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,8,power_law_1.01,0.17500799894332886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,8,power_law_1.01,0.1784127950668335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,8,balanced,0.23894399404525757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,8,power_law_1.01,0.1776703953742981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,8,power_law_1.01,0.20590720176696778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,8,balanced,0.4046826759974162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,8,power_law_1.2,0.07136639952659607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,8,power_law_1.01,0.21719679832458497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,8,power_law_1.2,0.08332160115242004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,8,power_law_1.01,0.23793280124664307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,8,balanced,0.44582398732503253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,8,power_law_1.2,0.0610368013381958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,8,power_law_1.01,0.2745471954345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,8,power_law_1.2,0.07006080150604248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,8,power_law_1.01,0.36937599182128905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,8,power_law_1.2,0.067603200674057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,8,power_law_1.01,0.3809407949447632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,8,balanced,0.6509759823481241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,8,power_law_1.2,0.06680960059165955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,8,power_law_1.01,0.6278528213500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,8,power_law_1.2,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,8,power_law_1.01,0.676639986038208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,8,power_law_1.2,0.08280959725379944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,8,power_law_1.01,0.9912960052490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,8,balanced,0.854144016901652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,8,power_law_1.2,0.07704960107803345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,8,power_law_1.01,1.255679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,8,power_law_1.2,0.07844480276107788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,8,power_law_1.01,1.5683712005615233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,8,power_law_1.2,0.0774399995803833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,4,balanced,0.033370666205883026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,8,power_law_1.01,2.660121536254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,8,power_law_1.2,0.11141760349273681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,4,balanced,0.0379573330283165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,4,balanced,0.03862933317820231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,8,balanced,1.0594613552093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,8,power_law_1.01,4.5053760528564455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,8,power_law_1.2,0.10938880443572999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,4,balanced,0.04756799836953481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,4,balanced,0.06347733239332835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,8,power_law_1.2,0.09960960149765015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,4,balanced,0.07314666608969371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,4,balanced,0.07326933244864146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,8,power_law_1.2,0.17749760150909424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,4,balanced,0.08061866462230682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,8,power_law_1.2,0.18332159519195557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,4,balanced,0.08069866895675659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,4,balanced,0.08110400040944417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,8,power_law_1.2,0.18540159463882447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,4,balanced,0.08186133205890656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,8,balanced,1.6761706670125325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,4,balanced,0.08094933132330577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,8,power_law_1.2,0.21503360271453859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,4,balanced,0.08098133405049641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,8,power_law_1.2,0.2210752010345459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,4,balanced,0.08157866696516673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,4,balanced,0.11033599575360616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,8,power_law_1.2,0.26640000343322756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,4,balanced,0.11106666922569275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,8,power_law_1.2,0.28701438903808596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,4,balanced,0.11224533120791118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,4,balanced,0.18416533867518106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,8,power_law_1.2,0.3763008117675781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,4,balanced,0.1865440011024475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,8,power_law_1.2,0.4739520072937012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,4,balanced,0.19688532749811807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,8,power_law_1.2,0.6595263957977295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,4,balanced,0.20388267437616983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,8,power_law_1.2,0.8571071624755859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,4,balanced,0.22406933705012003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,8,power_law_1.2,1.2562111854553222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,4,balanced,0.24409067630767822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,8,power_law_1.2,1.5142720222473145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,4,balanced,0.41253864765167236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,8,power_law_1.2,1.7955583572387694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,8,balanced,3.311471939086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,8,power_law_1.2,3.192678451538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,4,balanced,0.4530400037765503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,8,power_law_1.2,6.165958404541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,4,balanced,0.6589546600977579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,4,balanced,0.8664906819661459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,4,power_law_1.01,0.03568640053272247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,4,power_law_1.01,0.04200960099697113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,4,balanced,1.0707253615061443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,4,power_law_1.01,0.04349440038204193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,4,power_law_1.01,0.05175039768218994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,4,power_law_1.2,0.035104000568389894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,4,power_law_1.01,0.06007680296897888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,4,power_law_1.2,0.04149760007858276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,4,power_law_1.01,0.06622719764709473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,4,power_law_1.2,0.04037759900093078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,4,power_law_1.01,0.06962559819221496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,4,power_law_1.2,0.05071359872817993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,4,power_law_1.01,0.073990398645401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,4,balanced,1.6883519490559895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,4,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,4,power_law_1.01,0.07952640056610108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,4,power_law_1.2,0.06312959790229797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,4,power_law_1.01,0.07551360130310059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,4,power_law_1.2,0.07061759829521179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,4,power_law_1.01,0.07775359749794006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,4,power_law_1.2,0.07653759717941284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,2,balanced,0.02951466788848241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,4,power_law_1.01,0.07872639894485474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,2,power_law_1.01,0.029772800207138062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,4,power_law_1.2,0.07485439777374267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,2,balanced,0.033728001018365227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,4,power_law_1.01,0.07959039807319641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,4,power_law_1.2,0.07927680015563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,2,power_law_1.01,0.0343423992395401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,2,balanced,0.0359946663180987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,4,power_law_1.01,0.08247039914131164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,2,balanced,0.04504533112049103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,4,power_law_1.2,0.0800320029258728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,2,power_law_1.01,0.037011200189590455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,4,power_law_1.01,0.10856319665908813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,2,power_law_1.01,0.0459199994802475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,4,power_law_1.2,0.07959679961204529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,2,balanced,0.06313066681226094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,2,power_law_1.01,0.053625601530075076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,4,power_law_1.2,0.07982720136642456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,4,power_law_1.01,0.11238399744033814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,4,power_law_1.2,0.08484479784965515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,4,power_law_1.01,0.11537280082702636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,2,balanced,0.08111999928951263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,2,power_law_1.01,0.06152960062026978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,4,power_law_1.2,0.10928000211715698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,4,balanced,3.3367414474487305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,4,power_law_1.01,0.18804479837417604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,2,balanced,0.07642666498819987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,2,power_law_1.01,0.06940799951553345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,4,power_law_1.2,0.11631360054016113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,4,power_law_1.01,0.205184006690979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,2,balanced,0.07640000184377034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,2,power_law_1.01,0.07095040082931518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,4,power_law_1.2,0.11424640417099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,2,balanced,0.07650133470694225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,4,power_law_1.01,0.2284032106399536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,2,power_law_1.01,0.07099519968032837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,4,power_law_1.2,0.20782079696655273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,2,balanced,0.07635200023651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,4,power_law_1.01,0.26238079071044923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,2,power_law_1.01,0.07186560034751892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,4,power_law_1.2,0.22115840911865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,2,balanced,0.08425066868464152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,4,power_law_1.01,0.32933759689331055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,2,power_law_1.01,0.08058879971504211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,2,balanced,0.08403733372688293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,4,power_law_1.2,0.24791040420532226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,4,power_law_1.01,0.3775871992111206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,2,power_law_1.01,0.08174719810485839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,2,balanced,0.08441600203514099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,4,power_law_1.2,0.29576959609985354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,4,power_law_1.01,0.574944019317627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,2,power_law_1.01,0.08386560082435608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,2,balanced,0.08544533451398213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,4,power_law_1.2,0.3635008096694946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,2,power_law_1.01,0.08579199910163879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,2,balanced,0.08668266733487447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,4,power_law_1.01,0.6180223941802978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,4,power_law_1.2,0.43980798721313474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,2,balanced,0.08744000395139058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,2,power_law_1.01,0.08615040183067321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,4,power_law_1.01,0.9094592094421386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,4,power_law_1.2,0.6000768184661865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,2,balanced,0.09009599685668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,2,power_law_1.01,0.09950079917907714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,4,power_law_1.01,1.1593536376953124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,4,power_law_1.2,0.7459839820861817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,2,balanced,0.1252959966659546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,2,power_law_1.01,0.10239360332489014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,2,power_law_1.2,0.03025279939174652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,4,power_law_1.2,0.9465984344482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,4,power_law_1.01,1.3873087882995605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,2,balanced,0.12898133198420206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,2,power_law_1.01,0.12991360425949097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,2,power_law_1.2,0.034508800506591795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,4,power_law_1.2,1.2356672286987305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,4,power_law_1.01,2.400339126586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,2,balanced,0.2141759991645813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,2,power_law_1.01,0.13902080059051514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,2,power_law_1.2,0.03436160087585449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,4,power_law_1.2,1.4880576133728027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,2,balanced,0.22403200467427573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,2,power_law_1.01,0.24917759895324706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,4,power_law_1.01,4.172921752929687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,2,power_law_1.2,0.045824000239372255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,4,power_law_1.2,2.530067253112793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,2,power_law_1.01,0.2702784061431885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,2,balanced,0.24703466892242432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,2,power_law_1.2,0.05333120226860046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,2,power_law_1.01,0.3330751895904541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,4,power_law_1.2,5.986003112792969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,2,power_law_1.2,0.057785600423812866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,2,balanced,0.26761066913604736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,2,power_law_1.01,0.3937664031982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,2,power_law_1.2,0.0686847984790802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,2,power_law_1.01,0.5107391834259033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,2,balanced,0.4547040065129598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,2,power_law_1.2,0.07023360133171082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,2,power_law_1.01,0.6301887989044189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,2,power_law_1.2,0.0710591971874237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,2,balanced,0.4973173141479492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,2,power_law_1.01,0.8833215713500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,2,power_law_1.2,0.07197440266609192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,2,power_law_1.01,1.1233280181884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,2,power_law_1.2,0.08008959889411926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,2,power_law_1.01,1.3535103797912598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,2,power_law_1.2,0.08186240196228027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,2,balanced,0.7240746815999349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,2,power_law_1.2,0.08362879753112792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,2,power_law_1.01,2.092537689208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,2,power_law_1.2,0.08709759712219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,2,power_law_1.01,4.0742847442626955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,2,power_law_1.2,0.0858240008354187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,2,balanced,0.9490613142649332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,2,power_law_1.2,0.09981439709663391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,1,balanced,0.02569066733121872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,1,power_law_1.01,0.025337600708007814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,2,power_law_1.2,0.10463999509811402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,1,balanced,0.02945599953333537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,1,power_law_1.01,0.0286655992269516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,2,power_law_1.2,0.13345919847488402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,1,balanced,0.03279466678698858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,1,power_law_1.01,0.03175680041313171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,1,balanced,0.046096002062161766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,2,power_law_1.2,0.14257279634475709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,1,power_law_1.01,0.04068480134010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,2,balanced,1.1756906509399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,1,balanced,0.06446933249632518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,2,power_law_1.2,0.2594815969467163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,1,power_law_1.01,0.05119360089302063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,2,power_law_1.2,0.2945472002029419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,1,balanced,0.0965226689974467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,2,power_law_1.2,0.3669312000274658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,1,power_law_1.01,0.05912320017814636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,2,power_law_1.2,0.40981121063232423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,1,balanced,0.09353599945704143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,1,power_law_1.01,0.07308800220489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,1,balanced,0.09273599584897359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,2,power_law_1.2,0.544921588897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,1,power_law_1.01,0.07669119834899903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,2,balanced,1.8473013242085774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,1,balanced,0.0895146628220876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,2,power_law_1.2,0.690937614440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,1,balanced,0.08919466535250346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,1,power_law_1.01,0.08134400248527526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,2,power_law_1.2,0.8805567741394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,1,balanced,0.08937600255012512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,2,power_law_1.2,1.1879039764404298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,1,power_law_1.01,0.0824512004852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,1,balanced,0.08973866701126099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,2,power_law_1.2,1.5374336242675781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,1,power_law_1.01,0.08316159844398499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,1,balanced,0.08994133273760478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,2,power_law_1.2,2.2293184280395506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,1,balanced,0.09113066395123799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,1,power_law_1.01,0.08546559810638428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,1,balanced,0.0918293297290802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,1,power_law_1.01,0.08693119883537292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,2,power_law_1.2,4.070975875854492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,1,balanced,0.09409067034721375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,1,power_law_1.01,0.0982591986656189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,1,balanced,0.09713066617647807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,1,power_law_1.01,0.10549119710922242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,1,balanced,0.11525332927703857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,1,power_law_1.01,0.11521279811859131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,1,balanced,0.12149332960446675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,1,power_law_1.01,0.12630399465560913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,2,balanced,3.6390612920125327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,1,balanced,0.16193600495656332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,1,power_law_1.01,0.14387199878692628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,1,balanced,0.17308266957600912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,1,power_law_1.01,0.16622719764709473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,1,balanced,0.3248639901479085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,1,power_law_1.01,0.20495998859405518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,1,power_law_1.01,0.24506239891052245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,1,balanced,0.34959999720255536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,1,power_law_1.2,0.02503040134906769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,1,power_law_1.01,0.4279935836791992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,1,power_law_1.2,0.02858879864215851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,1,power_law_1.01,0.504633617401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,1,balanced,0.6090666850407919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,1,power_law_1.2,0.03118720054626465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,1,power_law_1.01,0.6568640232086181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,1,power_law_1.2,0.03946239948272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,1,power_law_1.01,0.811359977722168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,1,power_law_1.2,0.046758401393890384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,1,balanced,0.6586879889170328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,1,power_law_1.2,0.05550720095634461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,1,power_law_1.01,1.1072447776794434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,1,power_law_1.2,0.07328640222549439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,1,power_law_1.01,1.407705593109131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,1,balanced,0.9603679974873861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,1,power_law_1.2,0.07454079985618592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,1,power_law_1.01,1.7077951431274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,1,power_law_1.2,0.0794048011302948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,1,power_law_1.01,2.6043840408325196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,1,power_law_1.2,0.08050559759140015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,1,power_law_1.2,0.08310400247573853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,1,power_law_1.01,5.002483367919922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,1,balanced,1.2638506889343262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,1,power_law_1.2,0.08787840008735656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,1,power_law_1.2,0.08873599767684937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,1,power_law_1.2,0.1000704050064087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,1,power_law_1.2,0.11159679889678956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,1,power_law_1.2,0.11684479713439941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,1,balanced,1.5652960141499836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,1,power_law_1.2,0.1333567976951599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,1,power_law_1.2,0.14580479860305787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,1,power_law_1.2,0.1675647974014282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,1,power_law_1.2,0.21314558982849122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,1,power_law_1.2,0.2565376043319702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,1,balanced,2.4662453333536782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,1,power_law_1.2,0.4427648067474365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,1,power_law_1.2,0.5255680084228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,1,power_law_1.2,0.6705152034759522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,1,power_law_1.2,0.8218560218811035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,1,power_law_1.2,1.1145919799804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,16,balanced,0.0547680010398229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,16,power_law_1.01,0.06652160286903382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,1,power_law_1.2,1.4151424407958983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,16,power_law_1.2,0.06667519807815551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,1,power_law_1.2,1.7146879196166993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,1,power_law_1.2,2.6038335800170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,16,balanced,0.05624000231424967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,16,power_law_1.2,0.06085759997367859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,1,power_law_1.2,4.999910354614258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,16,power_law_1.01,0.06080639958381653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,1,balanced,4.868154525756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,16,balanced,0.0554720014333725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,16,power_law_1.2,0.060198402404785155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,16,power_law_1.01,0.06257280111312866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,16,balanced,0.05403733253479004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,16,power_law_1.2,0.05651199817657471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,16,power_law_1.01,0.05541120171546936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,16,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,16,power_law_1.2,0.05864319801330566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,16,power_law_1.01,0.05923200249671936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,16,power_law_1.2,0.06836479902267456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,16,balanced,0.06619200110435486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,16,power_law_1.01,0.06804479956626892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,16,power_law_1.2,0.07518720030784606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,16,power_law_1.01,0.07459200024604798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,8,balanced,0.04646400113900503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,16,balanced,0.0747626672188441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,16,power_law_1.2,0.07518079876899719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,16,power_law_1.01,0.0747327983379364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,16,power_law_1.2,0.08446720242500305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,16,power_law_1.01,0.0880511999130249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,16,balanced,0.07524266839027405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,8,balanced,0.04773866633574168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,16,power_law_1.2,0.08550400137901307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,16,power_law_1.01,0.08410239815711976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,16,power_law_1.2,0.0884607970714569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,16,balanced,0.0874826709429423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,16,power_law_1.01,0.08835840225219727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,8,power_law_1.01,0.06051200032234192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,16,power_law_1.2,0.0906175971031189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,8,balanced,0.050144001841545105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,16,power_law_1.01,0.08629119992256165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,16,balanced,0.08624533812204997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,8,power_law_1.01,0.05445759892463684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,16,power_law_1.2,0.10027519464492798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,8,balanced,0.04937600096066793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,16,power_law_1.01,0.08661119937896729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,16,balanced,0.08574933807055156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,8,power_law_1.01,0.05729280114173889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,8,balanced,0.05020800232887268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,16,power_law_1.2,0.10016000270843506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,16,power_law_1.01,0.10431360006332398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,16,balanced,0.08572266499201457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,8,power_law_1.01,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,8,balanced,0.05471999943256378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,16,power_law_1.2,0.11239680051803588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,16,power_law_1.01,0.10495359897613525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,16,balanced,0.08715200424194336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,8,power_law_1.01,0.04958080053329468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,8,balanced,0.06198933223883311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,16,power_law_1.2,0.11375360488891602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,16,power_law_1.01,0.10748800039291381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,8,power_law_1.01,0.05430399775505066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,16,balanced,0.08676266670227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,8,balanced,0.061674664417902626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,16,power_law_1.2,0.11755520105361938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,16,power_law_1.01,0.11561599969863892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,8,power_law_1.01,0.06225280165672302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,8,balanced,0.06946133573849995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,16,balanced,0.08730666836102803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,16,power_law_1.2,0.19032319784164428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,16,power_law_1.01,0.17250560522079467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,8,power_law_1.01,0.06159359812736511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,8,balanced,0.0689279983441035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,16,balanced,0.08788266777992249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,16,power_law_1.2,0.22097280025482177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,16,power_law_1.01,0.1866943955421448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,8,power_law_1.01,0.07575039863586426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,8,balanced,0.06995733578999837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,16,balanced,0.09108799695968628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,16,power_law_1.2,0.3072000026702881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,16,power_law_1.01,0.27691519260406494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,8,power_law_1.01,0.07299200296401978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,8,balanced,0.07017600039641063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,16,balanced,0.09540266791979472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,16,power_law_1.2,0.3788288116455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,16,power_law_1.01,0.3560192108154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,8,power_law_1.01,0.073471999168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,8,balanced,0.07005866865317027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,16,balanced,0.09844266374905904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,16,power_law_1.2,0.5189951896667481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,8,power_law_1.01,0.07500159740447998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,16,power_law_1.01,0.44737920761108396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,8,balanced,0.0705866664648056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,16,power_law_1.2,0.8025216102600098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,16,balanced,0.12819199760754904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,8,power_law_1.01,0.07426559925079346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,8,power_law_1.2,0.05916799902915955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,8,balanced,0.07212266822655995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,16,power_law_1.01,0.5662208080291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,16,power_law_1.2,1.042470359802246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,8,power_law_1.01,0.08140159845352173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,16,balanced,0.13506666819254556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,8,power_law_1.2,0.05805439949035644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,8,balanced,0.07273066540559132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,16,power_law_1.01,1.031443214416504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,8,power_law_1.01,0.07403519749641418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,16,power_law_1.2,1.5850751876831055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,8,power_law_1.2,0.05578879714012146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,16,balanced,0.21019200483957926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,8,balanced,0.07355733215808868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,8,power_law_1.01,0.10952320098876953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,16,power_law_1.01,0.9966464042663574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,16,power_law_1.2,2.7732927322387697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,8,power_law_1.2,0.051635199785232545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,8,power_law_1.01,0.11817599534988403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,8,balanced,0.0780213326215744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,16,balanced,0.23785066604614258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,16,power_law_1.01,1.8087488174438477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,16,power_law_1.2,3.493318557739258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,8,power_law_1.2,0.04990079998970032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,8,power_law_1.01,0.13481600284576417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,8,balanced,0.08166400094827016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,8,power_law_1.2,0.05486720204353333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,8,power_law_1.01,0.1639680027961731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,16,power_law_1.01,2.5481151580810546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,16,power_law_1.2,4.153849411010742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,8,balanced,0.1327839990456899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,16,balanced,0.3485120137532552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,8,power_law_1.2,0.06256639957427979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,8,power_law_1.01,0.21456639766693114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,16,power_law_1.01,3.100435256958008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,16,power_law_1.2,7.773804473876953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,8,balanced,0.13869333267211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,8,power_law_1.2,0.06219519972801209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,8,power_law_1.01,0.22179200649261474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,16,balanced,0.4321173429489136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,8,power_law_1.2,0.073471999168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,16,power_law_1.01,5.292089462280273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,8,power_law_1.01,0.32755839824676514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,8,balanced,0.1983519991238912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,16,power_law_1.2,15.205107116699219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,8,power_law_1.2,0.07603840231895446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,8,power_law_1.01,0.4594560146331787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,16,power_law_1.01,10.621158599853516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,8,power_law_1.2,0.07804800271987915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,8,balanced,0.2285333275794983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,8,power_law_1.01,0.6780032157897949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,16,balanced,0.6346133152643839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,8,power_law_1.2,0.07807999849319458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,8,power_law_1.01,0.8177215576171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,8,balanced,0.3327680031458537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,8,power_law_1.2,0.07594239711761475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,8,power_law_1.01,1.48602237701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,8,power_law_1.2,0.09355520009994507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,8,power_law_1.01,1.9749439239501954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,8,power_law_1.2,0.10151679515838623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,8,balanced,0.4331146478652954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,16,balanced,0.8329439957936605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,8,power_law_1.2,0.11027840375900269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,8,power_law_1.01,2.2175615310668944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,8,power_law_1.2,0.11983360052108764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,8,power_law_1.01,3.7948287963867187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,8,power_law_1.2,0.14194560050964355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,8,balanced,0.6343253453572592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,8,power_law_1.01,7.5195457458496096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,8,power_law_1.2,0.17160320281982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,16,balanced,1.037221352259318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,4,balanced,0.032287999987602234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,8,power_law_1.2,0.2425920009613037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,4,balanced,0.03708266715208689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,8,power_law_1.2,0.28580479621887206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,8,balanced,0.8361120223999023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,4,balanced,0.037952000896135964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,8,power_law_1.2,0.45056638717651365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,4,balanced,0.043824002146720886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,8,power_law_1.2,0.4876992225646973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,8,power_law_1.2,0.8304896354675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,4,balanced,0.042992000778516136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,8,power_law_1.2,1.0989824295043946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,16,balanced,1.6413440704345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,4,balanced,0.04121066629886627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,8,balanced,1.0410186449686687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,4,power_law_1.01,0.03326080143451691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,4,balanced,0.04489600161711375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,8,power_law_1.2,1.825279998779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,4,power_law_1.01,0.03710080087184906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,4,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,4,balanced,0.04481600224971771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,8,power_law_1.2,2.299673652648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,4,power_law_1.01,0.044012799859046936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,4,power_law_1.01,0.04291839897632599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,8,power_law_1.2,2.5735679626464845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,4,power_law_1.01,0.041068801283836366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,4,balanced,0.052815998593966164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,8,power_law_1.2,4.742636871337891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,4,power_law_1.01,0.04402559995651245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,4,power_law_1.01,0.04384639859199524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,4,balanced,0.050293331344922386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,4,power_law_1.01,0.055225598812103274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,4,balanced,0.05045333504676819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,8,balanced,1.6439414024353027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,8,power_law_1.2,11.502848052978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,4,power_law_1.01,0.05324159860610962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,4,power_law_1.01,0.05576320290565491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,4,balanced,0.08078933258851369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,4,power_law_1.01,0.0834176003932953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,4,balanced,0.07236266632874806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,4,power_law_1.01,0.07880319952964783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,16,balanced,3.2489919662475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,4,balanced,0.07248533268769582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,4,power_law_1.01,0.08097919821739197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,4,balanced,0.07486933469772339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,4,power_law_1.01,0.08054400086402894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,4,power_law_1.01,0.08415359854698182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,4,balanced,0.07515733440717061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,4,power_law_1.01,0.09226239919662475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,4,balanced,0.07672533392906189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,4,power_law_1.01,0.11742080450057983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,4,power_law_1.01,0.15075199604034423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,4,balanced,0.08125866452852885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,4,power_law_1.01,0.1712831974029541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,4,balanced,0.08488532900810242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,4,power_law_1.01,0.23389439582824706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,4,balanced,0.12896000345547995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,8,balanced,3.2571840286254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,4,power_law_1.01,0.28638720512390137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,4,power_law_1.01,0.35971839427948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,4,balanced,0.13747732837994894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,4,power_law_1.01,0.4443647861480713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,4,power_law_1.01,0.6349631786346436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,4,balanced,0.1954186757405599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,4,power_law_1.01,0.9674816131591797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,4,balanced,0.23272534211476645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,4,power_law_1.01,1.2542719841003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,4,power_law_1.01,1.901740837097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,4,balanced,0.34385065237681073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,4,power_law_1.01,2.5202495574951174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,4,power_law_1.01,5.049663925170899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,4,balanced,0.43936534722646076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,4,balanced,0.6453226804733276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,4,balanced,0.8509600162506104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,4,balanced,1.0524906317392986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,4,power_law_1.2,0.03342719972133636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,4,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,4,power_law_1.2,0.037536001205444335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,4,power_law_1.2,0.04152320027351379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,2,balanced,0.02903999884923299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,4,power_law_1.2,0.04281600117683411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,4,balanced,1.6661386489868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,4,power_law_1.2,0.04142720103263855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,2,balanced,0.032655999064445496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,2,balanced,0.0347626656293869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,4,power_law_1.2,0.046028798818588255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,2,balanced,0.041477332512537636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,4,power_law_1.2,0.05130879878997803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,4,power_law_1.2,0.05671679973602295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,2,balanced,0.04177066683769226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,4,power_law_1.2,0.05308799743652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,2,balanced,0.04238399863243103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,4,power_law_1.2,0.060115200281143186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,2,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,2,balanced,0.04200533529122671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,4,power_law_1.2,0.08232319951057435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,2,balanced,0.04194133480389913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,2,power_law_1.01,0.03247359991073608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,4,power_law_1.2,0.0794048011302948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,2,power_law_1.01,0.033523198962211606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,4,power_law_1.2,0.07992960214614868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,2,power_law_1.01,0.03868159949779511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,2,balanced,0.04530133306980133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,4,power_law_1.2,0.07914239764213563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,2,power_law_1.01,0.04335359930992126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,4,power_law_1.2,0.08572800159454345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,2,balanced,0.04423466821511587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,2,power_law_1.01,0.04384639859199524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,4,balanced,3.3046239217122397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,4,power_law_1.2,0.10703359842300415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,2,balanced,0.045066664616266884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,2,power_law_1.01,0.04856959879398346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,4,power_law_1.2,0.11694719791412353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,2,power_law_1.01,0.04937599897384644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,4,power_law_1.2,0.14235520362854004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,2,power_law_1.01,0.05363199710845947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,2,balanced,0.05459733307361603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,4,power_law_1.2,0.19470720291137694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,2,power_law_1.01,0.05429760217666626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,2,balanced,0.05286933481693268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,2,power_law_1.01,0.055692797899246214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,4,power_law_1.2,0.2138240098953247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,2,balanced,0.054005334774653115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,4,power_law_1.2,0.3020927906036377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,2,power_law_1.01,0.057580798864364624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,2,power_law_1.2,0.029164800047874452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,2,power_law_1.01,0.0648256003856659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,4,power_law_1.2,0.45865597724914553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,2,power_law_1.2,0.032313600182533264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,2,power_law_1.01,0.06563839912414551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,4,power_law_1.2,0.559449577331543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,2,balanced,0.0804906686147054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,2,power_law_1.2,0.032467201352119446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,2,power_law_1.01,0.0909056007862091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,4,power_law_1.2,0.8068479537963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,2,balanced,0.07537599901358287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,2,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,2,power_law_1.01,0.08391039967536926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,2,balanced,0.07817066709200542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,2,power_law_1.2,0.043532800674438474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,4,power_law_1.2,1.1864255905151366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,2,power_law_1.01,0.09026560187339783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,2,power_law_1.2,0.0434688001871109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,2,balanced,0.08231999973456065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,4,power_law_1.2,1.6278656005859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,2,power_law_1.01,0.12016639709472657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,2,power_law_1.2,0.047391998767852786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,2,balanced,0.08638933300971985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,4,power_law_1.2,2.0955392837524416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,2,power_law_1.01,0.1287551999092102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,1,balanced,0.024959998826185863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,2,power_law_1.2,0.04842880070209503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,2,balanced,0.13796266913414001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,2,power_law_1.01,0.1641983985900879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,4,power_law_1.2,2.5894847869873048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,2,power_law_1.2,0.052025598287582395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,1,balanced,0.028933333853880566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,2,balanced,0.14685333768526712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,2,power_law_1.01,0.19751039743423462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,2,power_law_1.2,0.05268480181694031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,1,balanced,0.03196800003449122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,4,power_law_1.2,7.164966583251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,2,power_law_1.01,0.2577023983001709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,1,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,2,power_law_1.2,0.05578240156173706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,2,balanced,0.2111146648724874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,2,power_law_1.01,0.3355711936950684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,1,balanced,0.044079999128977455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,2,power_law_1.2,0.05959039926528931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,2,balanced,0.2530826727549235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,2,power_law_1.01,0.4914239883422852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,2,power_law_1.2,0.06257280111312866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,1,balanced,0.042490666111310325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,2,power_law_1.01,0.5795775890350342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,2,power_law_1.2,0.06528639793395996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,1,power_law_1.01,0.024172799289226533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,2,balanced,0.3785173495610555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,2,power_law_1.2,0.09255679845809936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,1,balanced,0.04222933451334635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,2,power_law_1.01,0.9298175811767578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,2,power_law_1.2,0.08548480272293091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,1,power_law_1.01,0.02736000120639801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,1,balanced,0.04138133426507314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,2,power_law_1.01,1.1475520133972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,2,power_law_1.2,0.09366400241851806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,2,balanced,0.48230401674906415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,1,balanced,0.04338666796684265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,1,power_law_1.01,0.029817599058151244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,2,power_law_1.01,1.5734527587890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,2,power_law_1.2,0.1226304054260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,1,power_law_1.01,0.0350847989320755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,1,balanced,0.04268800218900045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,2,power_law_1.01,2.2463872909545897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,2,power_law_1.2,0.13175040483474731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,1,balanced,0.0429066667954127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,1,power_law_1.01,0.04378879964351654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,1,power_law_1.2,0.023974399268627166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,2,power_law_1.2,0.16507519483566285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,2,balanced,0.7052373091379801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,1,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,2,power_law_1.01,4.582048034667968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,1,power_law_1.01,0.04299519956111908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,1,power_law_1.2,0.027244800329208375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,2,power_law_1.2,0.19267840385437013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,1,balanced,0.04646400113900503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,1,power_law_1.01,0.04552960097789764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,1,power_law_1.2,0.029471999406814574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,1,balanced,0.048485333720842995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,2,power_law_1.2,0.2684927940368652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,1,power_law_1.2,0.034534400701522826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,1,power_law_1.01,0.04848000109195709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,1,power_law_1.2,0.043673598766326906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,1,balanced,0.05624000231424967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,2,power_law_1.2,0.3156735897064209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,1,power_law_1.2,0.043219199776649474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,1,power_law_1.01,0.04959999918937683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,2,balanced,0.9274293581644694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,1,balanced,0.05806933343410492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,1,power_law_1.2,0.04801279902458191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,2,power_law_1.2,0.4821824073791504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,1,power_law_1.01,0.05050240159034729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,1,power_law_1.2,0.048281601071357726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,1,balanced,0.06073066592216492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,2,power_law_1.2,0.7340223789215088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,1,power_law_1.2,0.049491199851036075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,1,power_law_1.01,0.052723199129104614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,1,balanced,0.0942026674747467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,1,power_law_1.2,0.05088000297546387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,2,power_law_1.2,0.9581184387207031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,1,power_law_1.01,0.05568640232086182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,1,power_law_1.2,0.052908802032470705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,1,balanced,0.09831999739011128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,1,power_law_1.2,0.05621119737625122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,1,power_law_1.01,0.057120001316070555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,2,power_law_1.2,1.2666367530822753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,2,balanced,1.147653341293335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,1,power_law_1.2,0.056979197263717654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,1,balanced,0.16588800152142844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,1,power_law_1.2,0.060627198219299315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,1,power_law_1.01,0.06059520244598389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,2,power_law_1.2,1.5719103813171387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,1,power_law_1.2,0.07012479901313781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,1,balanced,0.1767253279685974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,1,power_law_1.01,0.06970880031585694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,1,power_law_1.2,0.07310720086097718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,2,power_law_1.2,2.2719743728637694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,1,power_law_1.2,0.07786880135536194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,1,power_law_1.01,0.07326719760894776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,1,balanced,0.25760533412297565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,2,power_law_1.2,5.030144119262696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,1,power_law_1.2,0.13445760011672975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,1,power_law_1.01,0.07780479788780212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,1,power_law_1.2,0.14669439792633057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,1,power_law_1.2,0.19442559480667115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,1,balanced,0.3357066710789998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,1,power_law_1.01,0.13305599689483644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,1,power_law_1.2,0.2216576099395752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,1,power_law_1.01,0.1444159984588623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,2,balanced,1.8085546493530273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,1,power_law_1.2,0.2985536098480225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,1,balanced,0.493125319480896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,1,power_law_1.2,0.3776128053665161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,1,power_law_1.01,0.19328000545501708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,1,power_law_1.2,0.5310848236083985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,1,power_law_1.01,0.22218239307403564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,1,power_law_1.2,0.6821184158325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,1,power_law_1.01,0.29767038822174074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,1,balanced,0.6472266515096029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,1,power_law_1.2,0.9831744194030761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,1,power_law_1.01,0.3748863935470581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,1,power_law_1.2,1.2815744400024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,1,power_law_1.01,0.5297984123229981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,1,power_law_1.2,1.5768063545227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,1,power_law_1.2,2.4766143798828124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,1,balanced,0.9494667053222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,1,power_law_1.01,0.6797567844390869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,1,power_law_1.2,4.863616180419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,1,power_law_1.01,0.9802432060241699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,1,power_law_1.01,1.278559970855713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,1,power_law_1.01,1.5707136154174806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,1,balanced,1.2516907056172688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,1,power_law_1.01,2.4618175506591795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,1,power_law_1.01,4.843999862670898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,2,balanced,3.5791200002034507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,1,balanced,1.5513760248819988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,8,balanced,0.056218668818473816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,8,balanced,0.05395199855168661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,8,balanced,0.05365866422653198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,8,balanced,0.054469332098960876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,8,balanced,0.05542933444182078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,8,balanced,0.05633600056171417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,1,balanced,2.4514613151550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,8,balanced,0.057189335425694786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,8,balanced,0.05665599803129832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,8,balanced,0.057162667314211525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,8,balanced,0.056176001826922096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,8,balanced,0.05955199897289276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,8,balanced,0.05682666599750519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,8,balanced,0.0565280020236969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,8,balanced,0.03773866593837738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,8,balanced,0.057578667998313904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,8,balanced,0.039120001097520195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,8,balanced,0.06599999964237213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,8,balanced,0.036874666810035706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,8,balanced,0.06702400247255962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,8,balanced,0.0390133336186409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,8,balanced,0.038906666139761605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,8,balanced,0.06413866579532623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,8,balanced,0.04019733270009359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,8,balanced,0.08409600456555684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,8,balanced,0.03930133332808813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,8,balanced,0.07751466830571492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,8,balanced,0.04009066770474116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,1,balanced,4.844837188720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,8,balanced,0.042992000778516136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,8,balanced,0.10481066505114238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,8,balanced,0.04375466704368591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,8,balanced,0.10514133175214131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,8,balanced,0.04426133135954539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,8,balanced,0.1490293343861898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,8,balanced,0.04492799937725067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,8,balanced,0.16831467549006143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,8,balanced,0.046165332198143005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,8,balanced,0.047040000557899475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,8,balanced,0.2540000081062317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,8,balanced,0.05638933181762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,8,balanced,0.05580266813437144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,8,balanced,0.3039039969444275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,8,balanced,0.05565333366394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,8,balanced,0.0687253326177597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,8,balanced,0.43562134106953937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,8,balanced,0.06870399912198384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,8,balanced,0.033786666889985405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,8,balanced,0.09485866626103719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,8,balanced,0.5323733488718668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,8,balanced,0.03281066566705704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,8,balanced,0.09999466935793559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,8,balanced,0.03324266771475474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,8,balanced,0.035045333206653595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,8,balanced,0.13635200262069702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,8,balanced,0.03621866554021835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,8,balanced,0.03562133262554804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,8,balanced,0.6627573172251383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,8,balanced,0.15246400237083435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,8,balanced,0.03640000025431315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,8,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,8,balanced,0.21225599447886148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,8,balanced,0.04151466737190882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,8,balanced,0.042319998145103455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,8,balanced,0.26813334226608276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,8,balanced,1.0217386881510417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,8,power_law_1.01,0.05141760110855102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,8,balanced,0.38275734583536786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,8,power_law_1.01,0.05286399722099304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,8,balanced,0.038762666285037994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,8,power_law_1.01,0.05193600058555603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,8,balanced,0.039893334110577904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,8,balanced,0.4790026744206746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,8,power_law_1.01,0.05406079888343811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,8,balanced,0.041162667175134025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,8,balanced,0.04032533367474874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,8,power_law_1.01,0.05437440276145935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,8,power_law_1.01,0.05905280113220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,8,power_law_1.01,0.03924480080604553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,8,balanced,2.00602134068807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,8,power_law_1.01,0.06056320071220398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,8,balanced,0.593946655591329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,8,power_law_1.01,0.06027519702911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,8,power_law_1.01,0.039705601334571836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,8,power_law_1.01,0.06293119788169861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,8,power_law_1.01,0.03916800022125244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,8,balanced,0.04939199984073639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,8,power_law_1.01,0.06897280216217042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,8,power_law_1.01,0.04206719994544983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,8,balanced,0.049642667174339294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,8,power_law_1.01,0.06929280161857605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,8,power_law_1.01,0.0400191992521286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,8,balanced,0.051311999559402466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,8,balanced,0.9099520047505697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,8,power_law_1.01,0.07309439778327942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,8,power_law_1.01,0.04306559860706329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,8,power_law_1.01,0.08538240194320679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,8,power_law_1.01,0.048172798752784726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,8,power_law_1.01,0.08150399923324585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,8,power_law_1.01,0.047884801030159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,8,power_law_1.2,0.05141119956970215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,8,power_law_1.01,0.1158784031867981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,8,power_law_1.01,0.05454720258712768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,8,power_law_1.2,0.05256320238113403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,8,power_law_1.01,0.11258879899978638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,8,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,8,power_law_1.2,0.05243520140647888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,8,balanced,0.06117333471775055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,8,power_law_1.01,0.12764159440994263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,8,power_law_1.01,0.05160319805145264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,8,power_law_1.2,0.0542527973651886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,8,power_law_1.01,0.03200640082359314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,8,balanced,0.06344533463319142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,8,power_law_1.01,0.05751680135726929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,8,power_law_1.01,0.16016639471054078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,8,balanced,1.7710347175598145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,8,power_law_1.2,0.0543615996837616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,8,power_law_1.01,0.03210879862308502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,8,power_law_1.01,0.06476799845695495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,8,power_law_1.01,0.2090751886367798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,8,power_law_1.2,0.059008002281188965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,8,power_law_1.01,0.03190400004386902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,8,power_law_1.01,0.06195840239524841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,8,power_law_1.01,0.2919359922409058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,8,power_law_1.2,0.06301440000534057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,8,power_law_1.01,0.03404799997806549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,8,power_law_1.01,0.0770367980003357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,8,power_law_1.01,0.29523839950561526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,8,power_law_1.2,0.060140800476074216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,8,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,8,power_law_1.01,0.08279680013656616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,8,power_law_1.01,0.4361152172088623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,8,power_law_1.2,0.06737279891967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,8,balanced,0.08152000109354655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,8,power_law_1.01,0.037862399220466615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,8,power_law_1.01,0.08630399703979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,8,power_law_1.01,0.509823989868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,8,power_law_1.2,0.07162879705429077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,8,power_law_1.01,0.04419200122356415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,8,power_law_1.01,0.7672768115997315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,8,power_law_1.01,0.11090559959411621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,8,power_law_1.2,0.06862080097198486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,8,power_law_1.01,0.04720639884471893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,8,power_law_1.01,0.13173760175704957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,8,power_law_1.01,0.8987648010253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,8,power_law_1.2,0.07754240036010743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,8,power_law_1.01,0.0473471999168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,8,balanced,0.09371733665466309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,8,power_law_1.01,0.18225280046463013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,8,power_law_1.2,0.08464639782905578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,8,power_law_1.01,1.4506367683410644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,8,power_law_1.01,0.05729280114173889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,8,balanced,0.1306826670964559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,8,power_law_1.2,0.08600320219993592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,8,power_law_1.01,0.2026047945022583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,8,power_law_1.01,1.9200704574584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,8,power_law_1.2,0.1014847993850708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,8,power_law_1.01,0.30256640911102295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,8,power_law_1.01,2.361484718322754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,8,power_law_1.01,0.0494592010974884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,8,power_law_1.2,0.11635839939117432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,8,power_law_1.01,0.2986047983169556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,8,balanced,0.1606880029042562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,8,power_law_1.01,3.690412902832031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,8,power_law_1.01,0.06007680296897888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,8,power_law_1.2,0.12094719409942627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,8,power_law_1.01,0.47307519912719725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,8,balanced,0.22959999243418375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,8,power_law_1.2,0.16877440214157105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,8,power_law_1.01,0.06097919940948486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,8,power_law_1.01,0.6162176132202148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,8,power_law_1.01,6.806719970703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,8,power_law_1.01,0.0739135980606079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,8,power_law_1.2,0.20181119441986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,8,power_law_1.01,0.9297408103942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,8,balanced,0.2845919926961263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,8,power_law_1.2,0.03925119936466217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,8,power_law_1.2,0.3111488103866577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,8,power_law_1.01,1.3336192131042481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,8,power_law_1.2,0.29506559371948243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,8,power_law_1.01,1.6718719482421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,8,power_law_1.2,0.03966720104217529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,8,power_law_1.01,0.07890560030937195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,8,power_law_1.2,0.4329343795776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,8,power_law_1.01,2.481023979187012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,8,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,8,power_law_1.01,0.08249599933624267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,8,balanced,0.4488106568654378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,8,power_law_1.2,0.47996158599853517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,8,power_law_1.2,0.04068480134010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,8,power_law_1.01,4.719475173950196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,8,power_law_1.01,0.09994239807128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,8,power_law_1.2,0.6693696022033692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,8,power_law_1.2,0.039987200498580934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,8,power_law_1.2,0.92807035446167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,8,balanced,0.5874666770299276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,8,power_law_1.2,0.0444927990436554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,8,power_law_1.01,0.11727360486984253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,8,power_law_1.2,1.4136704444885253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,8,power_law_1.2,0.049439999461174014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,8,power_law_1.2,1.8746816635131835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,8,power_law_1.01,0.13392640352249147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,8,balanced,0.724730650583903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,8,power_law_1.2,0.04766719937324524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,8,power_law_1.2,2.3042623519897463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,8,power_law_1.2,0.05271040201187134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,8,power_law_1.2,0.05896959900856018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,8,power_law_1.2,3.765043258666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,8,power_law_1.01,0.2172991991043091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,8,balanced,1.1476693153381348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,8,power_law_1.2,0.05136640071868896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,8,power_law_1.2,7.220877075195313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,8,power_law_1.01,0.25240321159362794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,8,power_law_1.2,0.06228479743003845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,8,power_law_1.01,0.42770562171936033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,8,power_law_1.2,0.06475520133972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,8,power_law_1.2,0.06236799955368042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,8,power_law_1.01,0.5297215938568115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,8,power_law_1.2,0.07564799785614014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,8,power_law_1.01,0.7957632064819335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,8,power_law_1.2,0.08406400084495544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,8,balanced,2.2409226099650064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,8,power_law_1.2,0.08662400245666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,8,power_law_1.01,1.030835247039795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,8,power_law_1.2,0.11842559576034546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,8,power_law_1.2,0.13463679552078248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,8,power_law_1.01,1.6368768692016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,8,power_law_1.2,0.1761664032936096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,8,power_law_1.01,2.006483268737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,8,power_law_1.2,0.2158207893371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,8,power_law_1.01,2.3265216827392576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,8,power_law_1.2,0.3142143964767456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,8,power_law_1.01,3.91541748046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,8,power_law_1.2,0.3535871982574463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,8,power_law_1.2,0.511513614654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,8,power_law_1.01,7.736672210693359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,8,power_law_1.2,0.6730559825897217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,8,power_law_1.2,0.9925696372985839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,8,power_law_1.2,1.3677568435668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,8,power_law_1.2,1.6633087158203126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,8,power_law_1.2,0.031974399089813234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,8,power_law_1.2,2.312339210510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,8,power_law_1.2,0.03198719918727875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,8,power_law_1.2,0.032179200649261476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,8,power_law_1.2,4.612486267089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,8,power_law_1.2,0.03480960130691528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,8,power_law_1.2,0.03518719971179962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,8,power_law_1.2,0.03776639997959137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,8,power_law_1.2,0.04547840058803558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,8,power_law_1.2,0.04726400077342987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,8,power_law_1.2,0.04733439981937408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,8,power_law_1.2,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,4,balanced,0.04273599882920583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,4,balanced,0.04098666707674662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,4,balanced,0.04993600149949392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,8,power_law_1.2,0.05308160185813904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,4,balanced,0.052576000491778054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,8,power_law_1.2,0.06230400204658508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,4,balanced,0.05309333403905233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,8,power_law_1.2,0.06470400094985962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,4,balanced,0.05434666574001312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,8,power_law_1.2,0.08106240034103393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,4,balanced,0.05407466491063436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,4,balanced,0.0528053343296051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,8,power_law_1.2,0.08141440153121948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,4,balanced,0.05472533404827118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,8,power_law_1.2,0.0871616005897522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,4,balanced,0.054431999723116554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,8,power_law_1.2,0.10360959768295289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,4,balanced,0.054330666859944664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,4,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,4,balanced,0.05684266487757365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,8,power_law_1.2,0.11969280242919922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,4,balanced,0.056128000219662987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,4,balanced,0.037077332536379494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,8,power_law_1.2,0.1483456015586853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,4,balanced,0.06800533334414165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,4,balanced,0.035674666364987694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,4,balanced,0.0681386689345042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,8,power_law_1.2,0.22172160148620607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,4,balanced,0.036837334434191384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,4,balanced,0.06448000172773997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,4,balanced,0.03900266687075297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,4,balanced,0.08016000191370647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,8,power_law_1.2,0.2595839977264404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,4,balanced,0.03898133337497711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,4,balanced,0.08653866251309712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,8,power_law_1.2,0.42478079795837403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,4,balanced,0.039306665460268654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,4,balanced,0.10345600048700969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,4,balanced,0.03986666599909464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,8,power_law_1.2,0.4995391845703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,4,balanced,0.1090880036354065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,4,balanced,0.03941866755485535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,8,power_law_1.2,0.7940032005310058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,4,balanced,0.16648000478744507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,4,balanced,0.04562133550643921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,8,power_law_1.2,1.0610367774963378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,4,balanced,0.0459199994802475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,4,balanced,0.18154666821161905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,4,balanced,0.042624001701672874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,8,power_law_1.2,1.6160255432128907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,4,balanced,0.04715733230113983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,4,balanced,0.25330666700998944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,8,power_law_1.2,2.071641540527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,4,balanced,0.04833066463470459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,8,power_law_1.2,2.5693952560424806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,4,balanced,0.04785599807898203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,4,balanced,0.32475733757019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,4,power_law_1.01,0.04578559994697571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,4,balanced,0.02719466636578242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,4,balanced,0.05646933118502299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,8,power_law_1.2,4.089433670043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,4,power_law_1.01,0.048179200291633605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,4,balanced,0.027232001225153606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,4,balanced,0.05625600119431814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,4,balanced,0.4694133202234904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,4,power_law_1.01,0.04836480021476745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,8,power_law_1.2,8.119213104248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,4,balanced,0.029872000217437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,4,balanced,0.056741332014401756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,4,power_law_1.01,0.052288001775741576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,4,balanced,0.032127998769283295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,4,balanced,0.06937600175539653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,4,power_law_1.01,0.0525439977645874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,4,balanced,0.579525351524353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,4,balanced,0.03238933285077413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,4,balanced,0.07666666805744171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,4,power_law_1.01,0.05370879769325256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,4,balanced,0.032826667030652366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,4,balanced,0.09021866321563721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,4,power_law_1.01,0.05731840133666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,4,balanced,0.03443199892838796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,4,power_law_1.01,0.03861759901046753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,4,balanced,0.729856014251709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,4,power_law_1.01,0.0571008026599884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,4,balanced,0.10097066561381023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,4,balanced,0.03364266703526179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,4,power_law_1.01,0.0377023994922638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,4,power_law_1.01,0.06020479798316956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,4,balanced,0.04252266883850098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,4,balanced,0.14453333616256714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,4,power_law_1.01,0.035724800825119016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,4,power_law_1.01,0.06509439945220948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,4,balanced,0.043290664752324425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,4,power_law_1.01,0.037913599610328676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,4,balanced,0.16582399606704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,4,power_law_1.01,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,4,power_law_1.01,0.03790720105171204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,4,balanced,1.148255983988444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,4,power_law_1.01,0.06721280217170715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,4,balanced,0.23298666874567667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,4,power_law_1.01,0.04158720076084137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,4,power_law_1.01,0.066348797082901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,4,power_law_1.01,0.04323199987411499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,4,balanced,0.29212266206741333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,4,power_law_1.01,0.07587199807167053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,4,power_law_1.01,0.04936319887638092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,4,power_law_1.01,0.08329600095748901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,4,power_law_1.01,0.051648002862930295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,4,balanced,0.037418665985266365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,4,power_law_1.01,0.09246079921722412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,4,balanced,0.4240853389104207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,4,power_law_1.01,0.05429120063781738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,4,balanced,0.039221333960692085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,4,power_law_1.01,0.028697600960731505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,4,power_law_1.01,0.10223360061645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,4,power_law_1.01,0.050432002544403075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,4,balanced,0.04071466624736786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,4,power_law_1.01,0.028332799673080444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,4,power_law_1.01,0.13415679931640626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,4,power_law_1.01,0.05187839865684509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,4,power_law_1.01,0.02876800000667572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,4,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,4,balanced,0.5362079938252767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,4,balanced,2.1838186581929526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,4,power_law_1.01,0.05751680135726929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,4,power_law_1.01,0.14126720428466796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,4,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,4,power_law_1.01,0.03299199938774109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,4,power_law_1.01,0.059411197900772095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,4,power_law_1.01,0.20915839672088624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,4,power_law_1.2,0.04216319918632507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,4,power_law_1.01,0.03637759983539581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,4,power_law_1.01,0.06538239717483521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,4,power_law_1.01,0.23486080169677734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,4,power_law_1.01,0.03945600092411041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,4,balanced,0.6616693337758383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,4,power_law_1.2,0.04819200038909912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,4,power_law_1.01,0.043372800946235655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,4,power_law_1.01,0.07182719707489013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,4,power_law_1.01,0.3392191886901855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,4,power_law_1.01,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,4,power_law_1.2,0.05072640180587769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,4,power_law_1.01,0.07096959948539734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,4,power_law_1.01,0.05190399885177612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,4,power_law_1.01,0.3634943962097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,4,power_law_1.2,0.05284479856491089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,4,power_law_1.01,0.09025279879570007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,4,balanced,0.04961599906285604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,4,power_law_1.01,0.5236608028411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,4,power_law_1.01,0.11570559740066529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,4,power_law_1.2,0.05292159914970398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,4,power_law_1.01,0.05018240213394165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,4,balanced,0.05101866523424784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,4,power_law_1.01,0.7462016105651855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,4,balanced,1.0381440321604412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,4,power_law_1.01,0.14856959581375123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,4,power_law_1.01,0.05367040038108826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,4,power_law_1.2,0.05418239831924439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,4,balanced,0.05296533306439718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,4,power_law_1.01,0.9456319808959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,4,power_law_1.01,0.05241600275039673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,4,power_law_1.01,0.17964160442352295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,4,power_law_1.2,0.058271998167037965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,4,power_law_1.01,0.06257280111312866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,4,power_law_1.01,1.651852798461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,4,power_law_1.01,0.21793920993804933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,4,power_law_1.2,0.059513598680496216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,4,power_law_1.01,1.7063104629516601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,4,power_law_1.01,0.2641855955123901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,4,power_law_1.2,0.05788159966468811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,4,power_law_1.01,0.0694208025932312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,4,power_law_1.01,0.38127999305725097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,4,balanced,0.06474666794141133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,4,power_law_1.01,0.07480319738388061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,4,power_law_1.01,3.277177429199219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,4,power_law_1.2,0.06793599724769592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,4,power_law_1.01,0.08631680011749268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,4,power_law_1.01,0.5887872219085694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,4,balanced,0.0692799985408783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,4,power_law_1.2,0.06355199813842774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,4,power_law_1.01,6.851507568359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,4,balanced,1.9854933420817058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,4,power_law_1.01,0.9204031944274902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,4,power_law_1.01,0.0958400011062622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,4,power_law_1.2,0.06479359865188598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,4,power_law_1.01,0.12933759689331054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,4,power_law_1.01,0.8870271682739258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,4,power_law_1.2,0.07626879811286927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,4,power_law_1.01,1.3872447967529298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,4,power_law_1.2,0.07925119996070862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,4,power_law_1.01,2.026803207397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,4,power_law_1.2,0.09088000059127807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,4,balanced,0.09222933650016785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,4,power_law_1.2,0.09571840167045594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,4,power_law_1.01,0.19756159782409669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,4,power_law_1.01,4.832416152954101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,4,power_law_1.01,0.27952640056610106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,4,power_law_1.2,0.09108480215072631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,4,balanced,0.10846400260925293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,4,power_law_1.01,0.32934401035308836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,4,power_law_1.2,0.16199040412902832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,4,power_law_1.01,0.40307841300964353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,4,balanced,0.1490239997704824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,4,power_law_1.01,0.668671989440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,4,power_law_1.2,0.1523200035095215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,4,balanced,0.18942399819691977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,4,power_law_1.01,0.8994367599487305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,4,power_law_1.2,0.2186880111694336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,4,balanced,0.280949334303538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,4,power_law_1.2,0.2377471923828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,4,power_law_1.2,0.35865600109100343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,4,balanced,0.37112534046173096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,4,power_law_1.01,1.3338239669799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,4,power_law_1.2,0.3778752088546753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,4,power_law_1.01,1.9302719116210938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,4,power_law_1.2,0.6520256042480469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,4,power_law_1.01,2.248057556152344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,4,power_law_1.2,0.7440512180328369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,4,power_law_1.01,3.740576171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,4,balanced,0.5664693514506022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,4,power_law_1.2,1.0075712203979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,4,power_law_1.01,7.295053100585937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,4,power_law_1.2,1.732262420654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,4,balanced,0.7413919766743978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,4,power_law_1.2,2.0755584716796873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,4,power_law_1.2,3.3849281311035155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,4,balanced,0.9184532960255941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,4,power_law_1.2,4.734912109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,4,balanced,1.4505707422892253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,4,power_law_1.2,0.04074240028858185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,4,balanced,2.8706080118815103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,4,power_law_1.2,0.0385343998670578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,4,power_law_1.2,0.03682560026645661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,4,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,4,power_law_1.2,0.03790079951286316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,4,power_law_1.2,0.041510400176048276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,4,power_law_1.2,0.04476799964904785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,4,power_law_1.2,0.05087360143661499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,4,power_law_1.2,0.05100160241127014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,4,power_law_1.2,0.05296639800071716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,4,power_law_1.2,0.05268480181694031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,4,power_law_1.2,0.056358402967453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,4,power_law_1.2,0.05898879766464234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,4,power_law_1.2,0.0611840009689331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,4,power_law_1.2,0.06485120058059693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,4,power_law_1.2,0.07360000014305115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,4,power_law_1.2,0.07875199913978577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,4,power_law_1.2,0.029292801022529603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,4,power_law_1.2,0.09191039800643921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,4,power_law_1.2,0.028409600257873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,4,power_law_1.2,0.10962560176849365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,4,power_law_1.2,0.028870400786399842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,4,power_law_1.2,0.14932479858398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,4,power_law_1.2,0.031692799925804135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,4,power_law_1.2,0.2012160062789917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,4,power_law_1.2,0.03182719945907593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,4,power_law_1.2,0.28866560459136964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,4,power_law_1.2,0.035097599029541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,4,power_law_1.2,0.29820799827575684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,4,power_law_1.2,0.04172160029411316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,4,power_law_1.2,0.4253695964813232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,4,power_law_1.2,0.04589439928531647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,4,power_law_1.2,0.643558406829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,4,power_law_1.2,0.050361597537994386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,2,balanced,0.032170665760835014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,2,balanced,0.03190933416287104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,4,power_law_1.2,0.05066879987716675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,4,power_law_1.2,0.9233599662780761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,2,balanced,0.03400533397992452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,4,power_law_1.2,1.093996810913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,2,balanced,0.03794133414824804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,2,balanced,0.03643200049797694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,2,balanced,0.04814933240413666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,4,power_law_1.2,1.5258560180664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,4,power_law_1.2,0.05167999863624573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,2,balanced,0.038986665507157646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,2,balanced,0.051125332713127136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,4,power_law_1.2,2.3450496673583983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,4,power_law_1.2,0.051558399200439455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,2,balanced,0.03834133346875509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,2,balanced,0.05070933202902476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,4,power_law_1.2,0.056704002618789676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,4,power_law_1.2,5.40129280090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,2,balanced,0.05287466446558634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,2,balanced,0.038362666964530945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,4,power_law_1.2,0.06782720088958741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,2,balanced,0.05264000097910563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,2,balanced,0.03915733347336451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,2,balanced,0.05274133384227753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,2,balanced,0.0393653338154157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,2,balanced,0.053157334526379905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,4,power_law_1.2,0.07671679854393006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,2,balanced,0.04384533564249674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,2,balanced,0.05277333160241445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,2,balanced,0.04491733511288961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,4,power_law_1.2,0.07061120271682739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,2,balanced,0.042437334855397545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,2,balanced,0.05518933137257894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,4,power_law_1.2,0.09043200016021728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,2,balanced,0.0470773329337438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,2,balanced,0.05629866818586985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,4,power_law_1.2,0.11271040439605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,2,balanced,0.047685335079828896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,2,balanced,0.055861334005991616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,4,power_law_1.2,0.1386944055557251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,2,balanced,0.0460746685663859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,2,balanced,0.05774933099746704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,2,balanced,0.026074667771657307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,2,power_law_1.01,0.038796800374984744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,2,balanced,0.05952533086140951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,2,balanced,0.06663999954859416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,2,balanced,0.026762666801611584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,2,power_law_1.01,0.03797760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,2,balanced,0.05866133173306783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,2,balanced,0.029909332593282063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,2,balanced,0.06655466556549072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,4,power_law_1.2,0.21201279163360595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,2,power_law_1.01,0.0398144006729126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,2,balanced,0.03203733265399933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,2,balanced,0.06067200005054474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,2,balanced,0.0674773355325063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,4,power_law_1.2,0.26679039001464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,2,balanced,0.032655999064445496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,2,power_law_1.01,0.05051519870758057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,2,balanced,0.07198399802049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,4,power_law_1.2,0.43530879020690916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,2,balanced,0.08122133215268452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,2,balanced,0.033471999069054924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,2,power_law_1.01,0.051551997661590576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,2,balanced,0.07950399816036224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,2,balanced,0.034586665530999504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,4,power_law_1.2,0.46153597831726073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,2,power_law_1.01,0.05434240102767944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,2,balanced,0.08559466401735942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,2,power_law_1.01,0.033471998572349546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,2,balanced,0.034186666210492454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,2,balanced,0.10116266210873921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,4,power_law_1.2,0.8051456451416016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,2,power_law_1.01,0.05445759892463684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,2,balanced,0.11174399654070537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,2,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,4,power_law_1.2,0.8876799583435059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,2,balanced,0.11090667049090068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,2,power_law_1.01,0.0554751992225647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,2,balanced,0.12190933028856914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,2,power_law_1.01,0.0341376006603241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,2,power_law_1.01,0.055622398853302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,2,balanced,0.0395413339138031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,2,balanced,0.16119999686876932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,2,balanced,0.1848906675974528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,2,power_law_1.01,0.037510401010513304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,4,power_law_1.2,1.4211584091186524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,2,power_law_1.01,0.05737599730491638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,2,balanced,0.040021332601706185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,2,balanced,0.1941866676012675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,2,power_law_1.01,0.03710080087184906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,2,balanced,0.20398932695388794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,2,power_law_1.01,0.058815997838973996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,4,power_law_1.2,2.1533632278442383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,2,power_law_1.01,0.043270400166511534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,2,power_law_1.01,0.060787200927734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,2,balanced,0.2781920035680135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,4,power_law_1.2,2.563532829284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,2,balanced,0.2917226751645406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,2,power_law_1.01,0.0434112012386322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,2,power_law_1.01,0.061318397521972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,4,power_law_1.2,3.956403350830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,2,power_law_1.01,0.04371840059757233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,2,balanced,0.3595946629842122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,2,power_law_1.01,0.07406079769134521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,2,balanced,0.3741439978281657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,2,power_law_1.01,0.04656000137329101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,2,power_law_1.01,0.07986559867858886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,2,balanced,0.04004266609748205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,4,power_law_1.2,8.998381042480469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,2,power_law_1.01,0.05004799962043762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,2,power_law_1.01,0.0278656005859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,2,power_law_1.01,0.09199360013008118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,2,balanced,0.5201333363850912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,2,balanced,0.04260799785455068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,2,balanced,0.5456746816635132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,2,power_law_1.01,0.04709759950637817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,2,power_law_1.01,0.09236479997634887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,2,power_law_1.01,0.027116799354553224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,2,balanced,0.04432533184687296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,2,power_law_1.01,0.1035647988319397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,2,power_law_1.01,0.05416319966316223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,2,power_law_1.01,0.027724799513816834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,2,balanced,0.04555733501911163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,2,balanced,0.6497866710027059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,2,power_law_1.01,0.055340802669525145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,2,power_law_1.01,0.1266816020011902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,2,balanced,0.6808106899261475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,2,power_law_1.01,0.03368319869041443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,2,power_law_1.01,0.15883519649505615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,2,power_law_1.01,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,2,power_law_1.01,0.033081600069999696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,2,power_law_1.01,0.1785599946975708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,2,power_law_1.01,0.06457599997520447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,2,balanced,0.8047146797180176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,2,power_law_1.01,0.03694719970226288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,2,balanced,0.055306668082873024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,2,balanced,0.8478826681772867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,2,power_law_1.01,0.06867200136184692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,2,power_law_1.01,0.2796031951904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,2,power_law_1.01,0.039878401160240176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,2,balanced,0.056362668673197426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,2,power_law_1.01,0.0720192015171051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,2,power_law_1.01,0.24072320461273194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,2,power_law_1.01,0.040915200114250184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,2,balanced,0.0609386662642161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,2,power_law_1.01,0.08487039804458618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,2,power_law_1.01,0.3749248027801514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,2,power_law_1.01,0.10268800258636475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,2,power_law_1.01,0.5059199810028077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,2,balanced,1.2621013323465984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,2,power_law_1.01,0.045023998618125914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,2,balanced,1.3380106290181477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,2,power_law_1.01,0.1310528039932251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,2,power_law_1.01,0.7569727897644043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,2,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,2,power_law_1.01,0.15199359655380248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,2,power_law_1.01,1.0530176162719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,2,balanced,0.07687999804814656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,2,power_law_1.01,0.211244797706604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,2,power_law_1.01,1.2760704040527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,2,balanced,0.08363200227419536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,2,power_law_1.01,0.2591423988342285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,2,power_law_1.01,0.05069440007209778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,2,power_law_1.01,2.1071807861328127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,2,power_law_1.01,0.3806272029876709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,2,power_law_1.01,0.053958398103713986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,2,power_law_1.01,0.49683198928833006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,2,power_law_1.01,3.366099166870117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,2,power_law_1.01,0.05297279953956604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,2,balanced,0.113946666320165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,2,power_law_1.01,0.6677887916564942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,2,balanced,2.4264960289001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,2,power_law_1.01,0.05581439733505249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,2,balanced,2.5373759269714355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,2,balanced,0.13868266344070435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,2,power_law_1.01,0.9167167663574218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,2,power_law_1.01,0.06679040193557739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,2,balanced,0.20438933372497559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,2,power_law_1.01,1.0670080184936523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,2,power_law_1.01,0.07033600211143494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,2,balanced,0.27668267488479614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,2,power_law_1.01,1.7690752029418946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,2,power_law_1.01,0.07514240145683289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,2,balanced,0.40650665760040283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,2,power_law_1.01,3.063212776184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,2,power_law_1.01,0.1043328046798706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,2,balanced,0.5185759862263998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,2,power_law_1.01,0.11641600131988525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,2,power_law_1.01,0.16399359703063965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,2,power_law_1.01,0.19471999406814575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,2,power_law_1.01,0.3168256044387817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,2,balanced,0.7904533545176188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,2,power_law_1.01,0.43968000411987307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,2,power_law_1.01,0.6484416007995606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,2,balanced,1.0267253716786702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,2,power_law_1.2,0.03877759873867035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,2,power_law_1.01,0.786572790145874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,2,power_law_1.2,0.03943040072917938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,2,power_law_1.2,0.04042240083217621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,2,power_law_1.01,1.148921585083008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,2,balanced,1.2703999678293865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,2,power_law_1.2,0.0493120014667511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,2,power_law_1.01,1.6069759368896483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,2,power_law_1.2,0.05135359764099121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,2,power_law_1.01,1.879417610168457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,2,power_law_1.2,0.05438079833984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,2,power_law_1.01,3.2197185516357423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,2,balanced,2.0265013376871743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,2,power_law_1.2,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,2,power_law_1.01,5.9937278747558596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,2,power_law_1.2,0.05494400262832642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,2,power_law_1.2,0.05704960227012634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,2,power_law_1.2,0.056992000341415404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,2,power_law_1.2,0.05854719877243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,2,power_law_1.2,0.06042240262031555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,2,balanced,4.009141286214192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,2,power_law_1.2,0.06088320016860962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,2,power_law_1.2,0.0692351996898651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,2,power_law_1.2,0.08251519799232483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,2,power_law_1.2,0.08655999898910523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,2,power_law_1.2,0.08979840278625488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,2,power_law_1.2,0.11360640525817871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,2,power_law_1.2,0.03213439881801605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,2,power_law_1.2,0.13089920282363893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,2,power_law_1.2,0.033190399408340454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,2,power_law_1.2,0.1720576047897339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,2,power_law_1.2,0.03431679904460907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,2,power_law_1.2,0.19644800424575806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,2,power_law_1.2,0.03616639971733093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,2,power_law_1.2,0.03640320003032684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,2,power_law_1.2,0.23238399028778076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,2,power_law_1.2,0.04132480025291443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,2,power_law_1.2,0.30785279273986815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,2,power_law_1.2,0.04333440065383911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,2,power_law_1.2,0.04327679872512817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,2,power_law_1.2,0.43859200477600097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,2,power_law_1.2,0.04577920138835907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,2,power_law_1.2,0.4315199851989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,2,power_law_1.2,0.05108479857444763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,2,power_law_1.2,0.7228288173675537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,2,power_law_1.2,0.048089599609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,2,power_law_1.2,1.1016192436218262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,2,power_law_1.2,0.05067520141601563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,2,power_law_1.2,0.05185279846191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,2,power_law_1.2,1.4505599975585937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,2,power_law_1.2,0.05934079885482788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,2,power_law_1.2,0.06689280271530151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,2,power_law_1.2,2.201529693603516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,2,power_law_1.2,0.06707199811935424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,2,power_law_1.2,4.559750366210937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,2,power_law_1.2,0.07360000014305115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,2,power_law_1.2,0.088019198179245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,2,power_law_1.2,0.10495359897613525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,2,power_law_1.2,0.13525760173797607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,2,power_law_1.2,0.156985604763031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,2,power_law_1.2,0.20159358978271485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,2,power_law_1.2,0.28012800216674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,2,power_law_1.2,0.37606399059295653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,2,power_law_1.2,0.5490111827850341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,2,power_law_1.2,0.7419328212738037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,2,power_law_1.2,0.9358976364135743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,2,power_law_1.2,1.2529600143432618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,2,power_law_1.2,1.8886016845703124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,2,power_law_1.2,3.527801513671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,1,balanced,0.033045334120591484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,1,balanced,0.02995733420054118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,1,balanced,0.03405333310365677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,1,balanced,0.03885866701602936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,1,balanced,0.03958400090535482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,1,balanced,0.047024001677831016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,1,balanced,0.040762667854626976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,2,power_law_1.2,0.026668798923492432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,1,balanced,0.049125333627065025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,1,balanced,0.042026668787002563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,1,balanced,0.05235733091831207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,2,power_law_1.2,0.02805120050907135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,1,balanced,0.04123199979464213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,1,balanced,0.05130666494369507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,2,power_law_1.2,0.02775680124759674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,1,balanced,0.0425546665986379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,1,balanced,0.052015999952952065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,2,power_law_1.2,0.03203839957714081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,1,balanced,0.04322133461634318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,1,balanced,0.05420266588528951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,2,power_law_1.2,0.03283199965953827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,1,balanced,0.043552001317342125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,1,balanced,0.05388799806435903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,2,power_law_1.2,0.03717760145664215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,1,balanced,0.02739199995994568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,1,balanced,0.054058666030565895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,1,balanced,0.04544533292452494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,2,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,1,balanced,0.05667733152707418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,1,balanced,0.02811199923356374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,1,balanced,0.047168001532554626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,1,balanced,0.03249066571394602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,2,power_law_1.2,0.041203200817108154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,1,balanced,0.05877333382765452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,1,balanced,0.03389866650104523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,1,balanced,0.0496319979429245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,1,balanced,0.03676799933115641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,1,balanced,0.05905599892139435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,1,balanced,0.051039998730023704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,1,balanced,0.03746666759252548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,2,power_law_1.2,0.04764800071716309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,1,balanced,0.06141866743564606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,1,balanced,0.03846933444341024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,1,balanced,0.053114667534828186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,1,balanced,0.03972800076007843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,1,balanced,0.07166400055090587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,2,power_law_1.2,0.04748800098896026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,1,balanced,0.06322133541107178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,1,balanced,0.07376533250013988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,1,balanced,0.04404800136884054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,1,balanced,0.06423999865849812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,1,balanced,0.07620800038178761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,1,balanced,0.04558933277924856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,2,power_law_1.2,0.050963199138641356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,1,balanced,0.06805333495140076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,1,balanced,0.09549333651860555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,1,power_law_1.01,0.034745600819587705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,2,power_law_1.2,0.052767997980117796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,1,balanced,0.08640000224113464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,1,balanced,0.09622400005658467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,2,power_law_1.2,0.054611200094223024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,1,power_law_1.01,0.03666560053825378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,1,balanced,0.09108266234397888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,1,balanced,0.1285599966843923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,1,power_law_1.01,0.03949440121650696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,2,power_law_1.2,0.06101760268211365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,1,balanced,0.11782933274904887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,1,balanced,0.14528533816337585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,1,balanced,0.047600001096725464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,1,power_law_1.01,0.04778240025043488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,1,balanced,0.049973333875338234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,1,balanced,0.13758400082588196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,1,balanced,0.20251200596491495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,2,power_law_1.2,0.06954240202903747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,1,power_law_1.01,0.05118079781532288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,1,balanced,0.05300800005594889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,1,balanced,0.055311997731526695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,1,power_law_1.01,0.053414398431777955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,2,power_law_1.2,0.07507839798927307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,1,balanced,0.1943626602490743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,1,balanced,0.253983994325002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,1,power_law_1.01,0.055308800935745236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,2,power_law_1.2,0.08488960266113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,1,power_law_1.01,0.03255679905414581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,1,balanced,0.24460800488789877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,1,balanced,0.36982401212056476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,1,power_law_1.01,0.056358402967453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,1,balanced,0.06817600131034851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,1,power_law_1.01,0.03304960131645203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,1,power_law_1.01,0.05733759999275208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,2,power_law_1.2,0.10906879901885987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,1,balanced,0.3646986484527588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,1,balanced,0.07060799996058147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,1,balanced,0.481056014696757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,1,power_law_1.01,0.05880320072174072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,1,power_law_1.01,0.034246399998664856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,1,balanced,0.0765226682027181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,2,power_law_1.2,0.13347840309143066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,1,power_law_1.01,0.060550397634506224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,1,power_law_1.01,0.039724799990653994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,1,balanced,0.4734400113423665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,1,balanced,0.707530657450358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,1,power_law_1.01,0.040038400888442995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,1,power_law_1.01,0.062003201246261595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,2,power_law_1.2,0.17827199697494506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,1,power_law_1.01,0.04317440092563629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,2,power_law_1.2,0.21619200706481934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,1,power_law_1.01,0.0642687976360321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,1,balanced,0.6877013047536215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,1,balanced,0.1018399993578593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,1,power_law_1.01,0.04392319917678833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,2,power_law_1.2,0.3558464050292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,1,balanced,0.11572800079981486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,1,power_law_1.01,0.06976640224456787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,1,balanced,0.8728586832682291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,1,power_law_1.01,0.04556800127029419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,2,power_law_1.2,0.44677119255065917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,1,power_law_1.01,0.07631999850273133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,1,balanced,0.8745546340942383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,1,power_law_1.01,0.04552319943904877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,2,power_law_1.2,0.7045631885528565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,1,power_law_1.01,0.08414720296859741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,1,power_law_1.01,0.04683519899845123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,1,balanced,0.17231466372807822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,1,power_law_1.01,0.0865664005279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,2,power_law_1.2,0.7004608154296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,1,balanced,1.0875786940256755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,1,power_law_1.01,0.04935039877891541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,1,power_law_1.01,0.11435519456863404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,1,balanced,0.22778133551279703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,1,balanced,1.0858453114827473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,1,power_law_1.01,0.05190399885177612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,1,power_law_1.01,0.11650559902191163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,2,power_law_1.2,1.2550527572631835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,1,balanced,0.32952000697453815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,1,power_law_1.01,0.05305600166320801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,1,power_law_1.01,0.1431167960166931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,2,power_law_1.2,1.5157376289367677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,1,balanced,0.4285759925842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,1,power_law_1.01,0.06050559878349304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,1,power_law_1.01,0.16670080423355102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,1,balanced,1.739456017812093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,1,power_law_1.01,0.06629120111465454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,2,power_law_1.2,2.0264511108398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,1,balanced,0.6267040173212687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,1,power_law_1.01,0.22410240173339843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,1,power_law_1.01,0.07070720195770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,1,balanced,1.7021546363830566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,2,power_law_1.2,3.3305919647216795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,1,balanced,0.8202880223592123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,1,power_law_1.01,0.26759040355682373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,1,power_law_1.01,0.07653759717941284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,1,power_law_1.01,0.37502079010009765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,1,power_law_1.01,0.08959360122680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,2,power_law_1.2,7.209248352050781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,1,balanced,1.2307093143463135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,1,power_law_1.01,0.4825727939605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,1,power_law_1.01,0.1027008056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,1,power_law_1.01,0.12922240495681764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,1,power_law_1.01,0.6940032005310058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,1,power_law_1.01,0.1497599959373474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,1,power_law_1.01,0.9127488136291504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,1,balanced,1.6293546358744304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,1,power_law_1.01,0.20515840053558348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,1,power_law_1.01,1.1240063667297364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,1,balanced,3.28767999013265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,1,power_law_1.01,0.2566080093383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,1,balanced,3.4061279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,1,power_law_1.01,1.8009983062744142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,1,balanced,2.018261273701986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,1,power_law_1.01,0.3592639923095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,1,power_law_1.01,0.02691200077533722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,1,power_law_1.01,3.2819969177246096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,1,power_law_1.01,0.46494078636169434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,1,power_law_1.01,0.027961599826812743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,1,power_law_1.01,0.6775487899780274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,1,power_law_1.01,0.028806400299072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,1,balanced,3.2028001149495444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,1,power_law_1.01,0.9001791954040528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,1,power_law_1.01,0.03395200073719025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,1,power_law_1.01,1.1041600227355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,1,power_law_1.01,0.03473280072212219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,1,power_law_1.2,0.03421440124511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,1,power_law_1.01,1.7440256118774413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,1,power_law_1.01,0.03939839899539947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,1,power_law_1.2,0.036601600050926206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,1,power_law_1.01,3.3111103057861326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,1,power_law_1.01,0.04095360040664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,1,power_law_1.2,0.03758719861507416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,1,power_law_1.2,0.04679040014743805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,1,power_law_1.01,0.04384639859199524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,1,power_law_1.2,0.05063679814338684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,1,power_law_1.2,0.052300798892974856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,1,power_law_1.2,0.05497599840164184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,1,balanced,6.353450775146484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,1,power_law_1.01,0.04408319890499115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,1,power_law_1.2,0.05639680027961731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,1,power_law_1.01,0.046003198623657225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,1,power_law_1.2,0.05633280277252197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,1,power_law_1.2,0.05802879929542541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,1,power_law_1.2,0.058297598361968996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,1,power_law_1.01,0.05334399938583374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,1,power_law_1.2,0.06139519810676575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,1,power_law_1.01,0.05675519704818725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,1,power_law_1.2,0.06279680132865906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,1,power_law_1.2,0.06931840181350708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,1,power_law_1.01,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,1,power_law_1.2,0.07683839797973632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,1,power_law_1.01,0.0633791983127594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,1,power_law_1.2,0.08579199910163879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,1,power_law_1.2,0.08393599987030029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,1,power_law_1.01,0.0756928026676178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,1,power_law_1.2,0.10390399694442749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,1,power_law_1.01,0.07849599719047547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,1,power_law_1.2,0.11580799818038941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,1,power_law_1.2,0.14600319862365724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,1,power_law_1.01,0.08828160166740417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,1,power_law_1.2,0.16917120218276976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,1,power_law_1.2,0.2246016025543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,1,power_law_1.01,0.11023999452590942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,1,power_law_1.2,0.26711039543151854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,1,power_law_1.01,0.13076479434967042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,1,power_law_1.2,0.3747584104537964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,1,power_law_1.2,0.477843189239502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,1,power_law_1.01,0.1826815962791443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,1,power_law_1.01,0.24225919246673583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,1,power_law_1.2,0.6948991775512695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,1,power_law_1.2,0.9308095932006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,1,power_law_1.01,0.3457855939865112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,1,power_law_1.2,1.128998374938965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,1,power_law_1.01,0.44464640617370604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,1,power_law_1.2,1.7924224853515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,1,power_law_1.01,0.642739200592041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,1,power_law_1.2,3.2821376800537108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,1,power_law_1.01,0.8342464447021485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,1,power_law_1.01,1.233779239654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,1,power_law_1.01,1.6306751251220704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,1,power_law_1.01,2.03056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,1,power_law_1.01,3.2106624603271485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,1,power_law_1.01,6.351571273803711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,1,power_law_1.2,0.0335999995470047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,1,power_law_1.2,0.032595199346542356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,8,balanced,0.07492266595363617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,1,power_law_1.2,0.03444480001926422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,8,balanced,0.0703359991312027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,1,power_law_1.2,0.03954559862613678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,8,balanced,0.06589866677920024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,1,power_law_1.2,0.039955198764801025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,8,balanced,0.06803733110427856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,1,power_law_1.2,0.04336639940738678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,8,balanced,0.07001600166161855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,1,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,1,power_law_1.2,0.04447999894618988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,8,balanced,0.05046933392683665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,1,power_law_1.2,0.045049598813056944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,8,balanced,0.07056533296902974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,1,power_law_1.2,0.027577599883079527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,8,balanced,0.054458667834599815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,1,power_law_1.2,0.045561599731445315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,8,balanced,0.0699839989344279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,8,balanced,0.04885333279768626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,1,power_law_1.2,0.027635198831558228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,1,power_law_1.2,0.046387198567390445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,8,balanced,0.050853331883748375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,8,balanced,0.07124266525109609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,1,power_law_1.2,0.03498879969120026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,8,balanced,0.05221333106358846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,1,power_law_1.2,0.048614400625228885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,8,balanced,0.07027733325958252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,8,balanced,0.05296533306439718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,1,power_law_1.2,0.035622400045394895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,1,power_law_1.2,0.05177599787712097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,8,balanced,0.05320533116658529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,8,balanced,0.07035199801127116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,8,balanced,0.054042667150497437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,1,power_law_1.2,0.038975998759269714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,1,power_law_1.2,0.05253120064735413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,8,balanced,0.05269866685072581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,8,balanced,0.08029333253701527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,1,power_law_1.2,0.04095360040664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,1,power_law_1.2,0.059571200609207155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,8,balanced,0.05462400118509928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,8,balanced,0.07331733405590057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,8,power_law_1.01,0.07382400035858154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,8,balanced,0.05641599992911021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,1,power_law_1.2,0.06706560254096985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,1,power_law_1.2,0.04262399971485138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,8,balanced,0.05491200089454651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,8,balanced,0.07355733215808868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,8,power_law_1.01,0.06961280107498169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,8,balanced,0.05601066847642263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,1,power_law_1.2,0.07066239714622498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,8,balanced,0.04448533554871877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,8,balanced,0.05762133498986562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,8,balanced,0.07354666789372762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,8,power_law_1.01,0.06611199975013733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,1,power_law_1.2,0.07434880137443542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,1,power_law_1.2,0.04410879909992218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,8,balanced,0.07136000196139018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,8,balanced,0.04284800092379252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,8,balanced,0.0983786682287852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,8,balanced,0.07292800148328145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,8,power_law_1.01,0.067603200674057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,1,power_law_1.2,0.0884223997592926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,1,power_law_1.2,0.046540799736976626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,8,balanced,0.04262933135032654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,8,balanced,0.07100266714890797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,8,balanced,0.0969493289788564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,8,power_law_1.01,0.06862080097198486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,1,power_law_1.2,0.09934719800949096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,8,balanced,0.08847467104593913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,8,balanced,0.04566933214664459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,8,power_law_1.01,0.07137280106544494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,8,balanced,0.08553066849708557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,8,balanced,0.08726933598518372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,1,power_law_1.2,0.12845439910888673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,1,power_law_1.2,0.053350400924682614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,8,balanced,0.04699199895064036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,8,balanced,0.13033599654833475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,8,power_law_1.01,0.07525119781494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,8,balanced,0.11127466956774394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,1,power_law_1.2,0.14999040365219116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,8,balanced,0.13378666838010153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,1,power_law_1.2,0.056595200300216676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,8,balanced,0.04710933566093445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,8,power_law_1.01,0.07870720028877258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,1,power_law_1.2,0.20580480098724366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,8,balanced,0.10280000170071919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,8,balanced,0.19402666886647543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,8,power_law_1.01,0.08430079817771911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,1,power_law_1.2,0.05939840078353882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,8,balanced,0.047007997830708824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,1,power_law_1.2,0.2546816110610962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,8,balanced,0.20957332849502563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,8,balanced,0.1704746683438619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,8,power_law_1.01,0.09007999897003174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,1,power_law_1.2,0.06312959790229797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,8,balanced,0.04684266448020935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,1,power_law_1.2,0.35936000347137453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,8,balanced,0.2996799945831299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,8,balanced,0.1462399959564209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,8,power_law_1.01,0.0844223976135254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,8,balanced,0.05208533505598704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,1,power_law_1.2,0.4658368110656738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,8,power_law_1.01,0.10646400451660157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,1,power_law_1.2,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,8,balanced,0.3758560021718343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,8,balanced,0.05314666529496511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,8,balanced,0.2513599991798401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,1,power_law_1.2,0.6768959999084473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,8,power_law_1.01,0.10088319778442383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,1,power_law_1.2,0.07900800108909607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,8,balanced,0.258735994497935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,8,power_law_1.01,0.1223039984703064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,1,power_law_1.2,0.9120448112487793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,8,balanced,0.5546453396479288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,1,power_law_1.2,0.08762879967689514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,8,power_law_1.01,0.140665602684021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,1,power_law_1.2,1.1042559623718262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,8,balanced,0.3701813220977783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,8,power_law_1.01,0.1589568018913269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,1,power_law_1.2,0.11204479932785034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,8,balanced,0.7127093474070231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,1,power_law_1.2,1.7546239852905274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,8,power_law_1.01,0.17921279668807982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,8,balanced,0.050288001696268715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,1,power_law_1.2,0.13139840364456176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,8,balanced,0.4392640193303426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,8,power_law_1.01,0.24792959690093994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,1,power_law_1.2,3.3054271697998048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,8,balanced,0.05137600004673004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,8,power_law_1.01,0.2625344038009644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,8,balanced,0.8963946501413981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,1,power_law_1.2,0.18305280208587646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,8,balanced,0.052757332722345986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,8,power_law_1.01,0.39686400890350343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,8,balanced,0.6614133516947428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,8,balanced,0.05169066786766052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,1,power_law_1.2,0.24124159812927246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,8,power_law_1.01,0.4225855827331543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,1,power_law_1.2,0.34528000354766847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,8,power_law_1.01,0.5821055889129638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,8,balanced,0.8415466944376627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,8,balanced,1.3793120384216309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,8,power_law_1.01,0.7859007835388183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,1,power_law_1.2,0.44313597679138184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,8,power_law_1.01,0.04916479885578155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,8,power_law_1.01,1.0636992454528809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,1,power_law_1.2,0.641593599319458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,8,power_law_1.01,0.0470335990190506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,8,power_law_1.01,1.470579242706299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,1,power_law_1.2,0.8317824363708496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,8,balanced,0.060229331254959106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,8,power_law_1.01,0.047065600752830505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,8,balanced,1.0620533625284831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,8,power_law_1.01,2.167308807373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,8,balanced,0.060645331939061485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,1,power_law_1.2,1.2331392288208007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,8,power_law_1.01,0.05021439790725708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,8,power_law_1.01,2.6685375213623046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,8,balanced,0.06225066880385081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,8,power_law_1.01,0.05011199712753296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,1,power_law_1.2,1.6256704330444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,8,power_law_1.01,3.5266239166259767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,8,power_law_1.01,0.055302399396896365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,1,power_law_1.2,2.0266111373901365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,8,balanced,2.7160800298055015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,8,balanced,1.642133394877116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,8,power_law_1.01,0.06518399715423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,8,power_law_1.01,5.92229118347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,1,power_law_1.2,3.2042686462402346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,8,power_law_1.01,0.05863040089607239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,8,power_law_1.01,12.084102630615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,8,power_law_1.01,0.0585919976234436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,1,power_law_1.2,6.34730224609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,8,power_law_1.01,0.04373759925365448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,8,power_law_1.01,0.06424319744110107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,8,balanced,0.0775733341773351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,8,power_law_1.01,0.042771199345588685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,8,power_law_1.01,0.06348159909248352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,8,balanced,0.08101866642634074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,8,power_law_1.01,0.042559999227523806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,8,power_law_1.01,0.06744959950447083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,8,power_law_1.01,0.0456959992647171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,8,power_law_1.01,0.06997759938240052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,8,balanced,3.246373176574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,8,power_law_1.01,0.04642559885978699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,8,power_law_1.01,0.08335360288619995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,8,power_law_1.01,0.0973695993423462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,8,power_law_1.01,0.05041279792785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,8,power_law_1.01,0.11144319772720337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,8,power_law_1.01,0.06632959842681885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,8,balanced,0.11071999867757161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,8,power_law_1.01,0.06238080263137817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,8,power_law_1.01,0.12179839611053467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,8,balanced,0.12888532876968384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,8,power_law_1.01,0.07125759720802308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,8,power_law_1.01,0.16785919666290283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,8,power_law_1.01,0.07051519751548767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,8,power_law_1.01,0.18486399650573732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,8,balanced,0.18033599853515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,8,power_law_1.01,0.2246079921722412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,8,power_law_1.01,0.30690560340881345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,8,balanced,0.21793067455291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,8,power_law_1.01,0.0635968029499054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,8,power_law_1.01,0.46600961685180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,8,power_law_1.01,0.07593600153923034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,8,power_law_1.01,0.5064320087432861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,8,power_law_1.01,0.07739520072937012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,8,power_law_1.01,0.7530752182006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,8,power_law_1.01,0.08414720296859741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,8,balanced,0.32146666447321576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,8,power_law_1.01,0.8798591613769531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,8,power_law_1.01,1.3871808052062988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,8,balanced,0.42085333665211994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,8,power_law_1.01,0.08654720187187195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,8,power_law_1.01,1.976576042175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,8,power_law_1.01,0.10261759757995606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,8,balanced,0.6432586510976156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,8,power_law_1.01,2.544486427307129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,8,power_law_1.01,0.12799359560012818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,8,power_law_1.01,3.6059200286865236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,8,power_law_1.01,0.15843199491500853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,8,balanced,0.8533066908518473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,8,power_law_1.01,7.511603546142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,8,power_law_1.01,0.1728000044822693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,8,balanced,1.0552373727162678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,8,power_law_1.01,0.2736128091812134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,8,power_law_1.01,0.38514559268951415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,8,power_law_1.01,0.5363391876220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,8,balanced,1.6644426981608074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,8,power_law_1.01,0.74967041015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,8,power_law_1.01,1.0918463706970214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,8,power_law_1.01,1.506809616088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,8,power_law_1.01,2.2196928024291993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,8,power_law_1.01,2.758880043029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,8,balanced,3.2521387736002603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,8,power_law_1.01,3.608198547363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,8,power_law_1.01,5.91253776550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,8,power_law_1.01,11.69459228515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,8,power_law_1.2,0.07395840287208558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,8,power_law_1.2,0.06980479955673217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,8,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,8,power_law_1.2,0.06848000288009644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,8,power_law_1.2,0.06833279728889466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,8,power_law_1.2,0.07175679802894593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,8,power_law_1.2,0.049907198548316954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,8,power_law_1.2,0.08502399921417236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,8,power_law_1.2,0.05319679975509643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,8,power_law_1.2,0.07885439991950989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,8,power_law_1.2,0.04828799962997436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,8,power_law_1.2,0.09359359741210938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,8,power_law_1.2,0.05107839703559876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,8,power_law_1.2,0.1078976035118103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,8,power_law_1.2,0.08471680283546448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,8,power_law_1.2,0.05159040093421936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,8,power_law_1.2,0.10359040498733521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,8,power_law_1.2,0.0547327995300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,8,power_law_1.2,0.10026240348815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,8,power_law_1.2,0.06268159747123718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,8,power_law_1.2,0.12042880058288574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,8,power_law_1.2,0.058323198556900026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,4,balanced,0.05504000186920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,8,power_law_1.2,0.14789119958877564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,8,power_law_1.2,0.060134398937225345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,8,power_law_1.2,0.164300799369812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,4,balanced,0.04991999765237173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,4,balanced,0.04141866664091746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,8,power_law_1.2,0.06543359756469727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,8,power_law_1.2,0.043673598766326906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,8,power_law_1.2,0.18448640108108522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,4,balanced,0.06371200084686279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,4,balanced,0.04112533231576284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,8,power_law_1.2,0.06288639903068542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,8,power_law_1.2,0.04199680089950562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,8,power_law_1.2,0.258188796043396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,4,balanced,0.06692266464233398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,4,balanced,0.04791999856630961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,8,power_law_1.2,0.04221439957618713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,8,power_law_1.2,0.06974080204963684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,8,power_law_1.2,0.2647871971130371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,4,balanced,0.06713066498438518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,8,power_law_1.2,0.045638400316238406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,4,balanced,0.05072000126043955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,8,power_law_1.2,0.07422720193862915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,8,power_law_1.2,0.04645119905471802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,8,power_law_1.2,0.4045567989349365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,4,balanced,0.06862399975458781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,8,power_law_1.2,0.0511680006980896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,4,balanced,0.05161066850026449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,8,power_law_1.2,0.08287360072135926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,8,power_law_1.2,0.42352638244628904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,8,power_law_1.2,0.051545602083206174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,4,balanced,0.06844800213972728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,4,balanced,0.05215999980767568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,8,power_law_1.2,0.06546559929847717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,8,power_law_1.2,0.6375232219696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,8,power_law_1.2,0.10354559421539307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,4,balanced,0.06885333359241486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,8,power_law_1.2,0.06748160123825073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,4,balanced,0.0525439977645874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,8,power_law_1.2,0.07804800271987915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,8,power_law_1.2,0.733465576171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,8,power_law_1.2,0.11425919532775879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,4,balanced,0.06890133519967397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,4,balanced,0.052229334910710655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,8,power_law_1.2,0.12143360376358033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,8,power_law_1.2,1.201529598236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,4,balanced,0.06924800078074138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,4,balanced,0.05297600229581197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,8,power_law_1.2,0.16600320339202881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,8,power_law_1.2,1.3871295928955079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,8,power_law_1.2,0.06273279786109924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,4,balanced,0.076773335536321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,4,balanced,0.054133335749308266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,8,power_law_1.2,0.17726720571517945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,8,power_law_1.2,0.07279360294342041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,8,power_law_1.2,2.2244672775268555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,4,balanced,0.07051733136177063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,4,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,8,power_law_1.2,0.07708799839019775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,8,power_law_1.2,0.24839680194854735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,8,power_law_1.2,2.7452287673950195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,8,power_law_1.2,0.09681919813156128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,4,balanced,0.05513600011666616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,4,balanced,0.07048533360163371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,8,power_law_1.2,0.3433216094970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,8,power_law_1.2,3.86321907043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,4,balanced,0.05641599992911021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,8,power_law_1.2,0.5043712139129639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,4,balanced,0.07400000095367432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,8,power_law_1.2,0.10101120471954346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,4,balanced,0.05922666688760122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,8,power_law_1.2,0.4974720001220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,4,balanced,0.09031466643015544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,8,power_law_1.2,5.950246429443359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,8,power_law_1.2,0.10831359624862671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,4,balanced,0.07099733253320058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,8,power_law_1.2,0.7183487892150879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,4,balanced,0.09318400422732036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,8,power_law_1.2,0.1395967960357666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,4,balanced,0.07238933444023132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,8,power_law_1.2,12.749171447753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,8,power_law_1.2,1.0003583908081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,4,balanced,0.08917867143948872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,4,balanced,0.07416533430417378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,8,power_law_1.2,1.4943103790283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,4,balanced,0.1108746627966563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,8,power_law_1.2,0.16828800439834596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,4,balanced,0.0867733359336853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,8,power_law_1.2,2.016896057128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,8,power_law_1.2,0.19503359794616698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,4,balanced,0.12498133381207784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,4,balanced,0.0918293297290802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,8,power_law_1.2,2.490483283996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,4,balanced,0.1532533367474874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,4,balanced,0.12462400396664937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,8,power_law_1.2,0.33330559730529785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,8,power_law_1.2,3.8804481506347654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,4,balanced,0.1890453298886617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,8,power_law_1.2,0.3988095998764038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,4,balanced,0.13991999626159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,8,power_law_1.2,0.6380671977996826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,8,power_law_1.2,7.675981140136718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,4,balanced,0.24844266970952353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,8,power_law_1.2,0.7097407817840576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,4,balanced,0.19490132729212442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,4,balanced,0.2884053389231364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,4,balanced,0.24198400974273682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,8,power_law_1.2,1.1956352233886718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,8,power_law_1.2,1.5428095817565919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,4,balanced,0.4095199902852376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,4,balanced,0.3433493375778198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,8,power_law_1.2,2.131161689758301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,4,balanced,0.03107200066248576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,8,power_law_1.2,2.826860809326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,4,balanced,0.030965333183606465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,4,balanced,0.41118399302164715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,4,balanced,0.47335998217264813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,8,power_law_1.2,3.688703918457031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,4,balanced,0.04167999823888143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,8,power_law_1.2,5.5060993194580075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,4,balanced,0.045040001471837364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,4,balanced,0.6926133632659912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,4,balanced,0.5966933170954386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,8,power_law_1.2,11.92376937866211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,4,balanced,0.045706664522488914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,4,balanced,0.04594666759173075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,4,balanced,0.04679466784000397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,4,balanced,0.7783199946085612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,4,balanced,0.9158186912536621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,4,power_law_1.01,0.06932479739189149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,4,balanced,0.046709333856900535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,4,power_law_1.01,0.057158398628234866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,4,power_law_1.01,0.06037759780883789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,4,power_law_1.01,0.06591359972953796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,4,balanced,0.9637440045674642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,4,balanced,1.1410293579101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,4,power_law_1.01,0.06686720252037048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,4,balanced,0.05023466547330221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,4,power_law_1.01,0.06908800005912781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,4,balanced,0.05186666548252106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,4,power_law_1.01,0.07437440156936645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,4,power_law_1.01,0.07463039755821228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,4,power_law_1.01,0.07567359805107117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,4,balanced,1.5417653719584148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,4,balanced,1.7793173789978027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,4,power_law_1.01,0.04692479968070984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,4,power_law_1.01,0.07622399926185608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,4,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,4,power_law_1.01,0.08013439774513245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,4,power_law_1.01,0.045612800121307376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,4,power_law_1.01,0.08979200124740601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,4,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,4,power_law_1.01,0.09572479724884034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,4,power_law_1.01,0.04989440143108368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,4,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,4,power_law_1.01,0.11191680431365966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,4,balanced,0.053743998209635414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,4,power_law_1.01,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,4,power_law_1.01,0.12531839609146117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,4,balanced,0.05277866621812185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,4,power_law_1.01,0.05445759892463684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,4,power_law_1.01,0.13456000089645387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,4,balanced,2.985904057820638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,4,balanced,3.50712521870931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,4,power_law_1.01,0.056992000341415404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,4,power_law_1.01,0.12709759473800658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,4,power_law_1.01,0.056992000341415404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,4,power_law_1.01,0.18499200344085692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,4,power_law_1.01,0.05790719985961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,4,power_law_1.01,0.20421760082244872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,4,power_law_1.01,0.057792001962661745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,4,balanced,0.062090665102005005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,4,power_law_1.01,0.2502912044525146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,4,power_law_1.01,0.06343039870262146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,4,power_law_1.01,0.06715520024299622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,4,balanced,0.06330666442712148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,4,power_law_1.01,0.31734399795532225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,4,power_law_1.01,0.0673471987247467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,4,balanced,0.06542400022347768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,4,power_law_1.01,0.4520063877105713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,4,power_law_1.01,0.07002879977226258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,4,power_law_1.01,0.501855993270874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,4,balanced,0.08563733100891113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,4,power_law_1.01,0.08648319840431214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,4,power_law_1.01,0.8822527885437011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,4,balanced,0.09236266215642293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,4,power_law_1.01,0.10152959823608398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,4,power_law_1.01,1.2828031539916993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,4,power_law_1.01,0.09685760140419006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,4,power_law_1.01,1.6972415924072266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,4,power_law_1.01,0.1260607957839966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,4,power_law_1.01,2.775884819030762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,4,balanced,0.12358933687210083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,4,power_law_1.01,0.15200639963150026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,4,power_law_1.01,2.899897575378418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,4,balanced,0.1471999982992808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,4,power_law_1.01,0.215500807762146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,4,power_law_1.01,4.353728103637695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,4,power_law_1.01,0.2202752113342285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,4,power_law_1.01,0.3627135992050171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,4,power_law_1.01,9.477875518798829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,4,power_law_1.01,0.5021247863769531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,4,balanced,0.2125813364982605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,4,power_law_1.01,0.6910912036895752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,4,balanced,0.276799996693929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,4,power_law_1.01,0.7765567779541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,4,power_law_1.01,1.1873023986816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,4,balanced,0.42309868335723877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,4,power_law_1.01,1.5596287727355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,4,balanced,0.5549866755803426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,4,power_law_1.01,1.9255807876586915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,4,power_law_1.01,2.6736127853393556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,4,balanced,0.833295981089274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,4,power_law_1.01,6.705696105957031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,4,balanced,1.1080533663431804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,4,power_law_1.01,0.03758719861507416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,4,balanced,1.3782720565795898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,4,power_law_1.2,0.06652799844741822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,4,power_law_1.01,0.035769599676132205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,4,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,4,power_law_1.01,0.03771519958972931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,4,power_law_1.2,0.06032639741897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,4,power_law_1.2,0.04827519953250885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,4,power_law_1.01,0.045184001326560974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,4,power_law_1.2,0.06587520241737366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,4,balanced,2.187978744506836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,4,power_law_1.2,0.04510720074176788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,4,power_law_1.01,0.04466559886932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,4,power_law_1.2,0.06721280217170715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,4,power_law_1.2,0.04670720100402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,4,power_law_1.01,0.050732797384262084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,4,power_law_1.2,0.06692479848861695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,4,power_law_1.2,0.07297279834747314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,4,power_law_1.2,0.04979200065135956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,4,power_law_1.01,0.0551360011100769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,4,power_law_1.2,0.07335039973258972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,4,power_law_1.01,0.06185600161552429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,4,power_law_1.2,0.050246399641036985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,4,power_law_1.2,0.07672320008277893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,4,power_law_1.2,0.05372160077095032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,4,power_law_1.01,0.06309760212898255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,4,power_law_1.2,0.08168960213661194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,4,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,4,power_law_1.01,0.061375999450683595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,4,power_law_1.2,0.08833919763565064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,4,power_law_1.2,0.056576001644134524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,4,balanced,4.34446398417155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,4,power_law_1.2,0.09713280200958252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,4,power_law_1.2,0.05815039873123169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,4,power_law_1.2,0.09594879746437072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,4,power_law_1.2,0.06090239882469177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,4,power_law_1.01,0.05978879928588867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,4,power_law_1.2,0.10000640153884888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,4,power_law_1.2,0.06438400149345398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,4,power_law_1.01,0.06633599996566772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,4,power_law_1.2,0.11876480579376221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,4,power_law_1.2,0.06615679860115051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,4,power_law_1.01,0.06781439781188965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,4,power_law_1.2,0.0712768018245697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,4,power_law_1.2,0.14453760385513306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,4,power_law_1.01,0.0785215973854065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,4,power_law_1.2,0.07984640002250672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,4,power_law_1.2,0.14556800127029418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,4,power_law_1.2,0.0904640018939972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,4,power_law_1.2,0.16824959516525267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,4,power_law_1.01,0.08917760252952575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,4,power_law_1.2,0.10221439599990845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,4,power_law_1.2,0.2168639898300171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,4,power_law_1.01,0.08625919818878174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,4,power_law_1.2,0.09907839894294738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,4,power_law_1.2,0.2529855966567993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,2,balanced,0.04289066791534424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,4,power_law_1.01,0.11074559688568116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,4,power_law_1.2,0.12259839773178101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,4,power_law_1.2,0.3237760066986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,4,power_law_1.01,0.13408000469207765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,4,power_law_1.2,0.1610111951828003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,4,power_law_1.2,0.501087999343872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,2,balanced,0.04941866795221964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,4,power_law_1.2,0.03976320028305054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,4,power_law_1.01,0.15653120279312133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,4,power_law_1.2,0.2239680051803589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,2,balanced,0.06353599826494853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,4,power_law_1.2,0.7275968074798584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,4,power_law_1.2,0.036083200573921205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,4,power_law_1.2,0.2654144048690796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,2,balanced,0.06632000207901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,4,power_law_1.2,1.139673614501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,4,power_law_1.2,0.03986560106277466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,4,power_law_1.01,0.25478401184082033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,4,power_law_1.2,0.3740607976913452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,2,balanced,0.0672159989674886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,4,power_law_1.2,0.045516800880432126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,4,power_law_1.2,1.234931182861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,4,power_law_1.01,0.3459199905395508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,4,power_law_1.2,0.0457152009010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,2,balanced,0.06853866577148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,4,power_law_1.2,0.5084864139556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,4,power_law_1.2,0.05135999917984009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,4,power_law_1.2,2.090540885925293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,4,power_law_1.2,0.054150402545928955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,2,balanced,0.06776000062624614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,4,power_law_1.2,0.7553088188171386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,4,power_law_1.01,0.5322879791259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,4,power_law_1.2,2.2536767959594726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,4,power_law_1.2,0.05976960062980652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,2,balanced,0.06916800141334534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,4,power_law_1.2,0.9868351936340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,4,power_law_1.01,0.6188735961914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,4,power_law_1.2,3.4993152618408203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,4,power_law_1.2,0.06056320071220398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,2,balanced,0.06946666538715363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,4,power_law_1.01,1.104851245880127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,4,power_law_1.2,1.551763153076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,4,power_law_1.2,0.06624000072479248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,4,power_law_1.2,5.22795524597168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,2,balanced,0.06960000097751617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,4,power_law_1.01,1.242790412902832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,4,power_law_1.2,1.4949631690979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,2,balanced,0.07259200016657512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,4,power_law_1.01,1.9447999954223634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,4,power_law_1.2,1.8850688934326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,4,power_law_1.2,11.415264129638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,4,power_law_1.2,0.062105602025985716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,2,balanced,0.07467733323574066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,4,power_law_1.2,0.06958720088005066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,4,power_law_1.01,3.505971145629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,4,power_law_1.2,3.35601921081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,2,balanced,0.07542400062084198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,4,power_law_1.2,0.07264000177383423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,4,power_law_1.2,0.08184319734573364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,4,power_law_1.01,3.9260223388671873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,2,balanced,0.07807466884454091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,4,power_law_1.2,6.147430419921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,2,balanced,0.0881226658821106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,4,power_law_1.01,6.147251129150391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,4,power_law_1.2,0.08652160167694092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,2,balanced,0.09025067090988159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,4,power_law_1.2,0.09774720072746276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,4,power_law_1.01,12.714361572265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,4,power_law_1.2,0.11148159503936768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,2,balanced,0.09329066673914592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,4,power_law_1.2,0.14053759574890137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,2,balanced,0.1097813347975413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,4,power_law_1.2,0.1817471981048584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,2,balanced,0.035930665830771126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,2,balanced,0.1350826621055603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,4,power_law_1.2,0.2622015953063965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,4,power_law_1.2,0.39479680061340333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,2,balanced,0.15497600038846335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,2,balanced,0.037834666669368744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,2,balanced,0.04836800197760264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,2,balanced,0.19485867023468018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,4,power_law_1.2,0.5718976020812988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,4,power_law_1.2,0.7446591854095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,2,balanced,0.05092266698678335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,2,balanced,0.2642506758371989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,4,power_law_1.2,1.0217472076416017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,2,balanced,0.05299200117588043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,4,power_law_1.2,1.5235584259033204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,2,balanced,0.2878719965616862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,2,balanced,0.053114667534828186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,4,power_law_1.2,2.388006401062012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,4,power_law_1.2,3.4603649139404298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,2,balanced,0.05348266661167145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,2,balanced,0.4149920145670573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,4,power_law_1.2,4.894988632202148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,2,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,2,balanced,0.54202667872111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,4,power_law_1.2,7.153766632080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,2,balanced,0.05366399884223938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,4,power_law_1.2,11.279385375976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,2,balanced,0.0545066644748052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,2,balanced,0.8023839791615804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,2,balanced,0.05925333499908447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,2,balanced,0.05750933289527893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,2,balanced,0.058837334314982094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,2,balanced,1.0459520022074382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,2,balanced,0.06244266529877981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,2,balanced,0.06829333305358887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,2,balanced,0.06940266489982605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,2,balanced,0.029365333418051403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,2,balanced,1.2999946276346843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,2,balanced,0.07654400169849396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,2,balanced,0.030949334303538006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,2,balanced,0.09251733620961507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,2,balanced,0.04252266883850098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,2,balanced,0.10945066809654236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,2,balanced,0.046069333950678505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,2,balanced,0.1320799986521403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,2,balanced,2.04201602935791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,2,balanced,0.04641066491603851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,2,balanced,0.15154133240381876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,2,balanced,0.04713066418965658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,2,balanced,0.21568532784779867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,2,balanced,0.04855466882387797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,2,balanced,0.26394667228062946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,2,balanced,0.04860266546408335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,2,balanced,0.37759466965993244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,2,balanced,0.05317866802215576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,2,balanced,0.4910879929860433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,2,balanced,4.012639999389648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,2,balanced,0.05397333204746246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,2,power_law_1.01,0.04596480131149292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,2,balanced,0.7105333010355631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,2,power_law_1.01,0.05045120120048523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,2,power_law_1.01,0.047891199588775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,2,power_law_1.01,0.06324480175971985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,2,balanced,0.9301333427429199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,2,power_law_1.01,0.06814079880714416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,2,balanced,0.052784000833829246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,2,power_law_1.01,0.06540799736976624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,2,balanced,0.05505600074927012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,2,balanced,1.151413361231486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,2,power_law_1.01,0.0683135986328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,2,balanced,0.057717333237330117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,2,balanced,0.05906666815280914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,2,power_law_1.01,0.06984320282936096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,2,power_law_1.01,0.07317759990692138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,2,balanced,1.8401439984639485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,2,power_law_1.01,0.07597439885139465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,2,power_law_1.01,0.07537919878959656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,2,power_law_1.01,0.08002560138702393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,2,balanced,0.06963199873765309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,2,power_law_1.01,0.08318719863891602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,2,balanced,0.0717439999183019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,2,power_law_1.01,0.0825215995311737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,2,balanced,0.07772799829641978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,2,power_law_1.01,0.11670399904251098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,2,balanced,0.10225600004196167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,2,power_law_1.01,0.1161728024482727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,2,balanced,3.547034581502279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,2,power_law_1.01,0.11984000205993653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,2,balanced,0.11187733213106792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,2,power_law_1.01,0.15360000133514404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,2,power_law_1.01,0.1487615942955017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,2,power_law_1.01,0.20746240615844727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,2,power_law_1.01,0.2935935974121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,2,power_law_1.01,0.03731200098991394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,2,power_law_1.01,0.3465280055999756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,2,balanced,0.15711999932924905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,2,power_law_1.01,0.03997440040111542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,2,power_law_1.01,0.4554431915283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,2,balanced,0.20201599597930908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,2,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,2,power_law_1.01,0.03167999982833862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,2,power_law_1.01,0.6373760223388671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,2,balanced,0.30401066939036053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,2,power_law_1.01,0.050169599056243894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,2,power_law_1.01,0.03128319978713989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,2,power_law_1.01,0.7553599834442138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,2,power_law_1.01,0.05204480290412903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,2,balanced,0.3910826841990153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,2,power_law_1.01,0.04023039937019348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,2,power_law_1.2,0.048614400625228885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,2,power_law_1.01,1.1496383666992187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,2,power_law_1.01,0.05305600166320801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,2,power_law_1.01,0.045491200685501096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,2,balanced,0.5807733138402303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,2,power_law_1.2,0.04854399859905243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,2,power_law_1.01,1.431167984008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,2,power_law_1.01,0.05424000024795532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,2,power_law_1.01,0.04688000082969666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,2,power_law_1.2,0.05238400101661682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,2,power_law_1.01,1.9498687744140626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,2,power_law_1.01,0.054585599899291994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,2,power_law_1.01,0.0483711987733841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,2,balanced,0.7537759939829508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,2,power_law_1.2,0.0637503981590271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,2,power_law_1.01,0.0546176016330719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,2,power_law_1.01,3.2469760894775392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,2,power_law_1.01,0.052985602617263795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,2,power_law_1.2,0.06539520025253295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,2,power_law_1.01,0.05772799849510193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,2,power_law_1.01,0.055692797899246214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,2,power_law_1.2,0.06601600050926208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,2,balanced,1.1384639739990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,2,power_law_1.01,6.139385604858399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,2,power_law_1.01,0.06179839968681335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,2,power_law_1.2,0.06720640063285828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,2,power_law_1.01,0.0643455982208252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,2,power_law_1.2,0.038464000821113585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,2,power_law_1.01,0.06165760159492493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,2,power_law_1.2,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,2,power_law_1.01,0.06787840127944947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,2,balanced,1.5225760142008464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,2,power_law_1.01,0.06058880090713501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,2,power_law_1.2,0.03928320109844208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,2,power_law_1.2,0.07189760208129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,2,power_law_1.01,0.07478399872779846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,2,power_law_1.2,0.04103040099143982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,2,power_law_1.2,0.07602559924125671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,2,power_law_1.01,0.08413439989089966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,2,power_law_1.2,0.04979200065135956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,2,power_law_1.2,0.07351040244102477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,2,power_law_1.01,0.06223999857902527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,2,balanced,1.8945706685384114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,2,power_law_1.01,0.08655359745025634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,2,power_law_1.2,0.05192959904670715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,2,power_law_1.2,0.078847998380661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,2,power_law_1.01,0.06651520133018493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,2,power_law_1.01,0.09342079758644103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,2,power_law_1.2,0.05281280279159546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,2,power_law_1.2,0.07995520234107971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,2,power_law_1.01,0.06931840181350708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,2,power_law_1.2,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,2,power_law_1.01,0.11260160207748413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,2,power_law_1.2,0.09472000002861022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,2,power_law_1.01,0.07938560247421264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,2,power_law_1.2,0.05338240265846252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,2,power_law_1.2,0.10161279439926148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,2,power_law_1.01,0.1294592022895813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,2,balanced,3.012613296508789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,2,power_law_1.2,0.055692797899246214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,2,power_law_1.2,0.12003840208053589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,2,power_law_1.01,0.1810431957244873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,2,power_law_1.2,0.0574783980846405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,2,power_law_1.01,0.08736000061035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,2,power_law_1.2,0.12637439966201783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,2,power_law_1.01,0.2052544116973877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,2,power_law_1.2,0.057785600423812866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,2,power_law_1.01,0.09756159782409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,2,power_law_1.2,0.15310720205307007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,2,power_law_1.01,0.28256640434265134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,2,power_law_1.2,0.06461439728736877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,2,power_law_1.2,0.1510591983795166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,2,power_law_1.01,0.11017600297927857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,2,power_law_1.01,0.37523200511932375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,2,power_law_1.2,0.07136639952659607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,2,power_law_1.01,0.1429311990737915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,2,power_law_1.2,0.21902079582214357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,2,power_law_1.01,0.49818878173828124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,2,power_law_1.2,0.06817280054092408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,2,power_law_1.2,0.28917760848999025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,2,power_law_1.01,0.1614016056060791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,2,power_law_1.01,0.7427135944366455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,2,power_law_1.2,0.0856768012046814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,2,power_law_1.2,0.36971518993377683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,2,balanced,6.011749267578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,2,power_law_1.01,1.0516032218933105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,2,power_law_1.2,0.0898688018321991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,2,power_law_1.2,0.45693440437316896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,2,power_law_1.2,0.09032319784164429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,2,power_law_1.01,1.3044351577758788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,2,power_law_1.01,0.2342655897140503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,2,power_law_1.2,0.6971392154693603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,2,power_law_1.2,0.11200000047683716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,2,power_law_1.01,1.5174336433410645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,2,power_law_1.01,0.287558388710022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,2,power_law_1.2,0.8741888046264649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,2,power_law_1.2,0.13359999656677246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,2,power_law_1.01,0.44245758056640627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,2,power_law_1.01,2.5015167236328124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,2,power_law_1.2,1.3269887924194337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,2,power_law_1.2,0.18252160549163818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,2,power_law_1.01,0.6642496109008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,2,power_law_1.01,5.833280181884765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,2,power_law_1.2,0.222707200050354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,2,power_law_1.2,1.8685375213623048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,2,power_law_1.01,0.8817983627319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,2,power_law_1.2,0.3143167972564697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,2,power_law_1.2,2.2534271240234376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,2,power_law_1.01,0.9812031745910644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,2,power_law_1.2,0.39266560077667234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,2,power_law_1.2,0.033632001280784606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,2,power_law_1.01,1.5059776306152344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,2,power_law_1.2,2.7142335891723635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,2,power_law_1.2,0.5429759979248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,2,power_law_1.2,0.03351039886474609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,2,power_law_1.01,2.6557567596435545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,2,power_law_1.2,0.03462400138378143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,2,power_law_1.2,0.7191103935241699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,2,power_law_1.2,6.867769622802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,2,power_law_1.2,0.04604800045490265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,2,power_law_1.01,2.4460351943969725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,2,power_law_1.2,0.04647040069103241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,2,power_law_1.2,1.1001279830932618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,2,power_law_1.2,0.04854399859905243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,2,power_law_1.01,4.827430343627929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,2,power_law_1.2,1.4071871757507324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,2,power_law_1.2,0.05353599786758423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,2,power_law_1.2,0.06047359704971313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,2,power_law_1.2,1.9489919662475585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,2,power_law_1.01,9.787769317626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,2,power_law_1.2,2.9402624130249024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,2,power_law_1.2,0.06332160234451294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,2,power_law_1.2,0.06429439783096313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,2,power_law_1.2,4.863091278076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,2,power_law_1.2,0.06572800278663635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,2,power_law_1.2,0.06537600159645081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,2,power_law_1.2,0.06792960166931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,2,power_law_1.2,0.07862399816513062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,2,power_law_1.2,0.08983680009841918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,2,power_law_1.2,0.09164800047874451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,2,power_law_1.2,0.11002880334854126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,2,power_law_1.2,0.1482624053955078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,2,power_law_1.2,0.16238080263137816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,1,balanced,0.048842668533325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,2,power_law_1.2,0.24240639209747314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,1,balanced,0.0497920016447703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,2,power_law_1.2,0.3307391881942749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,2,power_law_1.2,0.5166399955749512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,1,balanced,0.06268266836802165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,2,power_law_1.2,0.591321611404419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,1,balanced,0.0658079981803894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,2,power_law_1.2,1.0425984382629394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,1,balanced,0.06724800169467926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,2,power_law_1.2,1.3466879844665527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,2,power_law_1.2,1.6838272094726563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,1,balanced,0.06809066732724507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,2,power_law_1.2,2.1979583740234374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,1,balanced,0.06901333232720692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,2,power_law_1.2,3.010675239562988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,1,balanced,0.06860800087451935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,2,power_law_1.2,5.422956848144532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,1,balanced,0.06960000097751617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,2,power_law_1.2,9.430675506591797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,1,balanced,0.07041066884994507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,1,balanced,0.08012799918651581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,1,balanced,0.07559466858704884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,1,balanced,0.0765173335870107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,1,balanced,0.03790933390458425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,1,balanced,0.08498133222262065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,1,balanced,0.037989333271980286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,1,balanced,0.08924266695976257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,1,balanced,0.047610665361086525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,1,balanced,0.09009599685668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,1,balanced,0.05142400165398916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,1,balanced,0.10386666655540466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,1,balanced,0.05246399839719137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,1,balanced,0.12531200051307678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,1,balanced,0.052383999029795326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,1,balanced,0.14447466532389322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,1,balanced,0.05306666592756907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,1,balanced,0.173744002978007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,1,balanced,0.05369600156943003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,1,balanced,0.2309760053952535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,1,balanced,0.054272000988324486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,1,balanced,0.3129653334617615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,1,balanced,0.05620799958705902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,1,balanced,0.39900799592336017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,1,balanced,0.05813866853713989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,1,balanced,0.06112533311049143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,1,balanced,0.5725706815719604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,1,balanced,0.06299200157324474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,1,balanced,0.06589866677920024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,1,balanced,0.6783520380655924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,1,balanced,0.07659733295440674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,1,balanced,0.07718400160471599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,1,balanced,0.9919306437174479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,1,balanced,0.0888426701227824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,1,balanced,0.10795199871063232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,1,balanced,0.12107200423876445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,1,balanced,1.3343626658121746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,1,balanced,0.15291200081507364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,1,balanced,0.2005066672960917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,1,power_law_1.01,0.041945600509643556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,1,balanced,1.6592159271240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,1,balanced,0.2783733407656352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,1,power_law_1.01,0.04645119905471802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,1,power_law_1.01,0.04769279956817627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,1,balanced,0.35284801324208576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,1,power_law_1.01,0.06399999856948853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,1,power_law_1.01,0.06643199920654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,1,balanced,0.5055573383967081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,1,balanced,2.562122662862142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,1,power_law_1.01,0.06759679913520814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,1,power_law_1.01,0.06965759992599488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,1,balanced,0.6225653489430746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,1,balanced,0.030938667555650074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,1,power_law_1.01,0.0695360004901886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,1,power_law_1.01,0.0698751986026764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,1,balanced,0.03506666670242945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,1,power_law_1.01,0.07288320064544677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,1,balanced,0.8892587025960287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,1,power_law_1.01,0.04120959937572479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,1,balanced,0.04448533554871877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,1,power_law_1.01,0.07746559977531434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,1,balanced,0.048122664292653404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,1,power_law_1.01,0.03709439933300018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,1,power_law_1.01,0.07852799892425537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,1,balanced,0.04929600159327189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,1,power_law_1.01,0.04036479890346527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,1,power_law_1.01,0.08058239817619324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,1,balanced,1.2049706776936848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,1,balanced,0.05029866596062978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,1,balanced,5.065253257751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,1,power_law_1.2,0.04885759949684143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,1,power_law_1.01,0.08922240138053894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,1,power_law_1.01,0.04848000109195709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,1,power_law_1.01,0.03227519989013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,1,balanced,0.05212266743183136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,1,power_law_1.2,0.04508160054683685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,1,power_law_1.01,0.050457602739334105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,1,power_law_1.01,0.0939199984073639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,1,balanced,0.05212800204753876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,1,power_law_1.01,0.03409920036792755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,1,power_law_1.2,0.04557439982891083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,1,balanced,1.4942986170450847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,1,power_law_1.01,0.11062400341033936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,1,power_law_1.01,0.05377280116081238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,1,power_law_1.2,0.06414719820022582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,1,power_law_1.01,0.03623040020465851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,1,power_law_1.2,0.06613119840621948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,1,power_law_1.01,0.110316801071167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,1,power_law_1.01,0.05567359924316406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,1,power_law_1.01,0.047040000557899475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,1,balanced,0.05619733532269796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,1,power_law_1.2,0.06787199974060058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,1,power_law_1.01,0.14986879825592042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,1,power_law_1.01,0.055225598812103274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,1,power_law_1.2,0.0697920024394989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,1,power_law_1.01,0.04778240025043488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,1,balanced,0.05752533177534739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,1,power_law_1.2,0.0706496000289917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,1,power_law_1.01,0.15208959579467773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,1,power_law_1.01,0.055302399396896365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,1,power_law_1.01,0.050393599271774295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,1,power_law_1.2,0.07118080258369446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,1,balanced,2.4157919883728027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,1,power_law_1.2,0.0746944010257721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,1,power_law_1.01,0.18027520179748535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,1,power_law_1.01,0.056454402208328244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,1,power_law_1.01,0.05311359763145447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,1,power_law_1.2,0.0772607982158661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,1,power_law_1.01,0.2458944082260132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,1,power_law_1.01,0.058361601829528806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,1,power_law_1.2,0.07922559976577759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,1,power_law_1.01,0.055078399181365964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,1,power_law_1.2,0.08075519800186157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,1,power_law_1.01,0.3276479959487915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,1,power_law_1.01,0.06175360083580017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,1,power_law_1.2,0.09009919762611389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,1,balanced,0.0621919979651769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,1,power_law_1.2,0.09642879962921143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,1,power_law_1.01,0.05664640069007874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,1,power_law_1.01,0.41013121604919434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,1,power_law_1.01,0.06458240151405334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,1,power_law_1.2,0.096288001537323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,1,balanced,0.06580266853173573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,1,power_law_1.01,0.06372479796409607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,1,power_law_1.2,0.1086016058921814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,1,power_law_1.01,0.5839871883392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,1,power_law_1.01,0.06996480226516724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,1,power_law_1.2,0.14491519927978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,1,balanced,0.06904000043869019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,1,power_law_1.01,0.07836800217628478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,1,power_law_1.01,0.7036863803863526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,1,power_law_1.2,0.15058560371398927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,1,balanced,0.07096000015735626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,1,power_law_1.2,0.1771456003189087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,1,power_law_1.01,0.08699520230293274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,1,power_law_1.01,1.0192959785461426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,1,power_law_1.01,0.0692799985408783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,1,power_law_1.2,0.23751680850982665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,1,balanced,4.688762664794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,1,power_law_1.01,0.0927616000175476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,1,power_law_1.01,1.3550592422485352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,1,power_law_1.2,0.31452159881591796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,1,power_law_1.01,0.07280640006065368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,1,power_law_1.2,0.40433921813964846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,1,power_law_1.2,0.04080640077590943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,1,power_law_1.01,0.12131199836730958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,1,power_law_1.01,0.07555199861526489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,1,balanced,0.08734400073687236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,1,power_law_1.01,1.6856704711914063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,1,power_law_1.2,0.5855296134948731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,1,power_law_1.2,0.03640320003032684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,1,power_law_1.01,0.1269503951072693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,1,power_law_1.01,0.08233600258827209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,1,power_law_1.2,0.7079999923706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,1,balanced,0.09148800373077393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,1,power_law_1.01,2.5450368881225587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,1,power_law_1.2,0.03806079924106598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,1,power_law_1.2,1.018393611907959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,1,power_law_1.01,0.15767680406570433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,1,balanced,0.0999786655108134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,1,power_law_1.2,1.3442367553710937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,1,power_law_1.2,0.049619200825691226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,1,power_law_1.01,0.0964352011680603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,1,power_law_1.01,5.023468780517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,1,power_law_1.01,0.2033535957336426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,1,balanced,0.1381439963976542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,1,power_law_1.2,1.7038080215454101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,1,power_law_1.2,0.05151360034942627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,1,power_law_1.01,0.10273920297622681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,1,power_law_1.01,0.2798912048339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,1,power_law_1.2,0.052825599908828735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,1,balanced,0.16367999712626138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,1,power_law_1.2,2.5389568328857424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,1,power_law_1.01,0.11697920560836791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,1,power_law_1.01,0.35976319313049315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,1,power_law_1.2,0.054771202802658084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,1,power_law_1.2,5.015814590454101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,1,power_law_1.01,0.15199999809265136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,1,power_law_1.2,0.055027198791503903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,1,power_law_1.01,0.503872013092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,1,power_law_1.2,0.05572479963302612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.01,0.1861631989479065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,1,power_law_1.01,0.6303423881530762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,1,power_law_1.2,0.05658239722251892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,1,balanced,0.2558719913164775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,1,power_law_1.2,0.05883520245552063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,1,power_law_1.01,0.9080191612243652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.01,0.27571840286254884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,1,balanced,0.32416532437006634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,1,power_law_1.2,0.06251519918441772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.01,0.347379207611084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,1,power_law_1.01,1.2095552444458009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,1,balanced,0.46989866097768146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,1,power_law_1.2,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.01,0.4935935974121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,1,power_law_1.01,1.5297727584838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,1,power_law_1.2,0.07036799788475037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,1,balanced,0.6160746812820435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,1,power_law_1.2,0.07863039970397949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.01,0.6393983840942383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,1,power_law_1.01,2.436147117614746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,1,power_law_1.2,0.08721920251846313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.01,0.9253503799438476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,1,balanced,0.9037973086039225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,1,power_law_1.2,0.0915391981601715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,1,power_law_1.01,4.6916545867919925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.01,1.216659164428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,1,power_law_1.2,0.11626880168914795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,1,balanced,1.1969813505808513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.01,1.7985536575317382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,1,power_law_1.2,0.1267135977745056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,1,power_law_1.2,0.15615999698638916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.01,2.384409523010254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,1,balanced,1.7927893002827961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,1,power_law_1.2,0.21136000156402587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,1,power_law_1.01,2.9722879409790037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,1,power_law_1.2,0.28046720027923583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,1,power_law_1.2,0.36676480770111086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,1,power_law_1.01,4.729625701904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,1,balanced,2.381765365600586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,1,power_law_1.2,0.5091775894165039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,1,power_law_1.2,0.6238336086273193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,1,power_law_1.2,0.9033535957336426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,1,power_law_1.01,9.399641418457032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,1,power_law_1.2,1.2172351837158204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,1,power_law_1.2,1.522169589996338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,1,balanced,2.9637438456217446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,1,power_law_1.2,2.4641536712646483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,1,power_law_1.2,4.677971267700196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,1,balanced,4.718085289001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,1,balanced,9.402362823486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,1,power_law_1.2,0.031225600838661195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,1,power_law_1.2,0.03392640054225922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,1,power_law_1.2,0.03429119884967804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,1,power_law_1.2,0.04748800098896026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,1,power_law_1.2,0.04834559857845307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,1,power_law_1.2,0.051046401262283325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,1,power_law_1.2,0.05245440006256104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,1,power_law_1.2,0.054054397344589236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,1,power_law_1.2,0.057529598474502563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,1,power_law_1.2,0.06251519918441772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,1,power_law_1.2,0.06901119947433472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,1,power_law_1.2,0.07281919717788696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,1,power_law_1.2,0.07514879703521729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,1,power_law_1.2,0.08232319951057435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,1,power_law_1.2,0.09826560020446777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,1,power_law_1.2,0.10173439979553223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,1,power_law_1.2,0.11324800252914428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,1,power_law_1.2,0.1484544038772583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.2,0.18606719970703126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.2,0.2746239900588989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.2,0.34917120933532714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.2,0.49321599006652833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.2,0.6405759811401367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.2,0.9271552085876464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.2,1.2008576393127441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,32,balanced,0.07778133451938629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.2,1.795577621459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,32,balanced,0.07659199833869934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.2,2.3792064666748045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,32,balanced,0.07659199833869934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,32,balanced,0.08528000116348267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,1,power_law_1.2,2.9743679046630858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,32,balanced,0.12417067090670268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,32,balanced,0.20678400993347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,1,power_law_1.2,4.727987289428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,32,balanced,0.20813866456349692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,32,balanced,0.20680532852808634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,1,power_law_1.2,9.390771484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,32,balanced,0.05226666728655497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,32,balanced,0.20677866538365683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,32,balanced,0.05952533086140951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,32,balanced,0.20560532808303833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,32,balanced,0.05232533315817515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,32,balanced,0.2058239976565043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,32,balanced,0.06771199901898702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,32,balanced,0.2081013321876526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,32,balanced,0.08747733632723491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,32,balanced,0.12898133198420206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,32,balanced,0.209114670753479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,32,balanced,0.13057600458463034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,32,balanced,0.2100480000178019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,32,balanced,0.1318773329257965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,32,power_law_1.01,0.205401611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,32,balanced,0.13263466954231262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,32,balanced,0.21620267629623413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,32,balanced,0.13341866930325827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,32,balanced,0.13495999574661255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,32,power_law_1.01,0.20202240943908692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,32,balanced,0.2156213323275248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,32,balanced,0.1357493301232656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,32,power_law_1.01,0.1441856026649475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,32,balanced,0.21919999519983926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,32,balanced,0.04953599969546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,32,balanced,0.13794666528701782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,32,balanced,0.13984533150990805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,32,power_law_1.01,0.10824320316314698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,32,balanced,0.04974400003751119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,32,balanced,0.23468265930811563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,32,balanced,0.14568533500035605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,32,balanced,0.0488373339176178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,32,power_law_1.01,0.14428160190582276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,32,balanced,0.1476853291193644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,32,balanced,0.24203733603159586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,32,balanced,0.0674186646938324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,32,balanced,0.15318399667739868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,32,power_law_1.01,0.14958080053329467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,32,balanced,0.08921066919962566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,32,balanced,0.16449066996574402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,32,balanced,0.25439467032750446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,32,power_law_1.01,0.1945855975151062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,32,balanced,0.1283466617266337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,32,balanced,0.17481066783269247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,32,balanced,0.12970667084058127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,32,power_law_1.01,0.19853440523147584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,32,balanced,0.28067199389139813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,32,balanced,0.19819200038909912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,32,balanced,0.13032000263532004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,32,power_law_1.01,0.18211840391159057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,32,balanced,0.1306880017121633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,32,balanced,0.22249066829681396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,32,power_law_1.01,0.19720319509506226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,32,balanced,0.1316213309764862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,32,balanced,0.3038880030314128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,32,balanced,0.1325920025507609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,32,power_law_1.01,0.19292160272598266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,32,balanced,0.25755733251571655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,32,balanced,0.13446399569511414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,32,power_law_1.01,0.20040318965911866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,32,balanced,0.13529599706331888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,32,balanced,0.36554133892059326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,32,power_law_1.01,0.20449280738830566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,32,power_law_1.01,0.13123199939727784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,32,balanced,0.3094506661097209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,32,balanced,0.1376479963461558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,32,power_law_1.01,0.22560639381408693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,32,power_law_1.01,0.12410240173339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,32,balanced,0.14266133308410645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,32,power_law_1.01,0.22851200103759767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,32,power_law_1.01,0.1067199945449829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,32,balanced,0.4226613442103068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,32,balanced,0.14525333046913147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,32,power_law_1.01,0.08300799727439881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,32,balanced,0.3918293317159017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,32,power_law_1.01,0.26307199001312254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,32,balanced,0.14855999747912088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,32,power_law_1.01,0.09065600037574768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,32,power_law_1.01,0.26981120109558104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,32,power_law_1.01,0.11310080289840699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,32,power_law_1.01,0.32296319007873536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,32,power_law_1.2,0.2182528018951416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,32,power_law_1.01,0.13978879451751708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,32,balanced,0.4703093369801839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,32,power_law_1.01,0.11872639656066894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,32,power_law_1.01,0.2937536001205444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,32,power_law_1.2,0.20170879364013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,32,balanced,0.46671466032663983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,32,power_law_1.01,0.12602239847183228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,32,balanced,0.16087999939918518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,32,power_law_1.01,0.12117760181427002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,32,power_law_1.01,0.37010560035705564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,32,power_law_1.2,0.09486719965934753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,32,power_law_1.01,0.07322239875793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,32,power_law_1.01,0.11984000205993653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,32,power_law_1.2,0.11284480094909669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,32,power_law_1.01,0.3823807954788208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,32,power_law_1.01,0.07621759772300721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,32,power_law_1.01,0.12889599800109863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,32,power_law_1.2,0.12876800298690796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,32,power_law_1.01,0.09462400078773499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,32,power_law_1.01,0.47528958320617676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,32,power_law_1.2,0.1386240005493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,32,power_law_1.01,0.12567039728164672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,32,power_law_1.01,0.11052800416946411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,32,power_law_1.01,0.5963647842407227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,32,balanced,0.6510506470998129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,32,balanced,0.657535990079244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,32,balanced,0.17307732502619425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,32,power_law_1.2,0.18431999683380126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,32,power_law_1.01,0.13013119697570802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,32,power_law_1.01,0.1155776023864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,32,power_law_1.01,0.8214783668518066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,32,power_law_1.2,0.18302079439163207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,32,power_law_1.01,0.13871359825134277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,32,power_law_1.01,0.1181439995765686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,32,balanced,0.19366933902104697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,32,power_law_1.01,1.013868808746338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,32,power_law_1.01,0.1474303960800171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,32,power_law_1.2,0.18018560409545897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,32,power_law_1.01,0.11521919965744018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,32,power_law_1.01,1.3750335693359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,32,balanced,0.20905067523320517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,32,power_law_1.2,0.18763519525527955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,32,power_law_1.01,0.15679359436035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,32,power_law_1.01,0.12275840044021606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,32,power_law_1.01,1.8982719421386718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,32,power_law_1.2,0.1931712031364441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,32,power_law_1.01,0.16700799465179444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,32,power_law_1.01,0.1386623978614807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,32,power_law_1.2,0.21071360111236573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,32,power_law_1.01,2.057542419433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,32,power_law_1.01,0.16833280324935912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,32,power_law_1.01,0.13630720376968383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,32,balanced,0.8334933121999105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,32,balanced,0.8057440121968588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,32,power_law_1.2,0.20648319721221925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,32,power_law_1.01,0.1989184021949768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,32,power_law_1.01,0.13880959749221802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,32,power_law_1.01,3.387251281738281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,32,power_law_1.2,0.22723839282989503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,32,balanced,0.2540266712506612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,32,power_law_1.01,0.1995136022567749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,32,power_law_1.01,0.15633920431137086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,32,power_law_1.2,0.27494399547576903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,32,power_law_1.01,6.49130859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,32,power_law_1.01,0.26679680347442625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,32,power_law_1.01,0.17087359428405763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,32,power_law_1.2,0.291596794128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,32,power_law_1.01,0.2859519958496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,32,balanced,0.28676267464955646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,32,power_law_1.2,0.2999743938446045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,32,power_law_1.01,0.18367999792099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,32,power_law_1.01,0.3442176103591919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,32,power_law_1.2,0.3529344081878662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,32,power_law_1.01,0.2134848117828369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,32,power_law_1.2,0.3341952085494995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,32,power_law_1.01,0.46257920265197755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,32,balanced,0.41127467155456543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,32,power_law_1.2,0.4540863990783691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,32,power_law_1.01,0.5799808025360107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,32,balanced,1.031066656112671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,32,power_law_1.01,0.23766400814056396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,32,balanced,0.9949599901835123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,32,power_law_1.2,0.40577921867370603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,32,power_law_1.01,0.7521215915679932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,32,power_law_1.2,0.5411200046539306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,32,power_law_1.01,1.0101119995117187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.01,0.21380479335784913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,32,balanced,0.49348799387613934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,32,power_law_1.2,0.7299903869628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,32,power_law_1.01,1.4133376121520995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,32,power_law_1.01,0.29463040828704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,32,power_law_1.2,0.9194815635681153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,32,power_law_1.01,1.7888832092285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.01,0.36290559768676756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,32,power_law_1.2,1.055577564239502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,32,power_law_1.01,2.682841682434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,32,power_law_1.2,1.7583423614501954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,32,power_law_1.01,0.4175871849060059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,32,power_law_1.01,5.30376968383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,32,power_law_1.2,2.497337532043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.01,0.5713151931762696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,32,power_law_1.2,2.9406848907470704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,32,power_law_1.01,0.8484352111816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.01,1.0469440460205077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,32,power_law_1.2,4.953408050537109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,32,balanced,0.7275413672129313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,32,balanced,1.6010133425394695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,32,balanced,1.5373867352803547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,32,power_law_1.01,1.5698176383972169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,32,power_law_1.2,11.941785430908203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.01,2.327289581298828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,32,power_law_1.01,2.5236223220825194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,32,power_law_1.01,4.419456100463867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,32,balanced,0.947007973988851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,32,power_law_1.01,9.59335708618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,32,balanced,1.1810186703999836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,32,power_law_1.2,0.13154560327529907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,32,power_law_1.2,0.12461440563201905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,32,power_law_1.2,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,32,power_law_1.2,0.08711680173873901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,32,power_law_1.2,0.09584640264511109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,32,power_law_1.2,0.09607040286064147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,32,power_law_1.2,0.12300159931182861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,32,power_law_1.2,0.1171455979347229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,32,power_law_1.2,0.11720960140228272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,32,balanced,3.1733118693033853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,32,power_law_1.2,0.11679359674453735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,32,power_law_1.2,0.12993919849395752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,32,power_law_1.2,0.13054720163345337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,32,balanced,3.0488694508870444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,32,power_law_1.2,0.14447360038757323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,32,balanced,1.8748373985290527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,32,power_law_1.2,0.14651520252227784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,32,power_law_1.2,0.16640000343322753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,32,power_law_1.2,0.1873471975326538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,32,power_law_1.2,0.18010239601135253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,32,power_law_1.2,0.213753604888916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,32,power_law_1.2,0.23098878860473632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,32,power_law_1.2,0.27253758907318115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,32,power_law_1.2,0.2891968011856079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,32,power_law_1.2,0.4172351837158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,32,power_law_1.2,0.5286592006683349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,32,power_law_1.2,0.6767807960510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,32,power_law_1.2,0.8793024063110352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,32,power_law_1.2,1.2941951751708984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,32,power_law_1.2,1.7184959411621095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,32,power_law_1.2,2.223187255859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,32,power_law_1.2,3.0250688552856446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,32,power_law_1.2,7.573996734619141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,32,balanced,3.7386293411254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,32,power_law_1.2,0.14042880535125732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,32,power_law_1.2,0.12634880542755128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,32,power_law_1.2,0.060659199953079224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,32,power_law_1.2,0.08263040184974671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,32,power_law_1.2,0.08709120154380798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,32,power_law_1.2,0.10539519786834717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,32,power_law_1.2,0.12202240228652954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,32,power_law_1.2,0.11539839506149292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,32,power_law_1.2,0.12384639978408814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,32,power_law_1.2,0.12478079795837402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,16,balanced,0.053114667534828186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,32,power_law_1.2,0.14012800455093383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,16,balanced,0.06866666674613953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,16,balanced,0.050623998045921326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,32,power_law_1.2,0.14198399782180787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,16,balanced,0.05979733169078827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,16,balanced,0.05173333485921224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,16,balanced,0.06534400085608165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,32,power_law_1.2,0.14658559560775758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,16,balanced,0.06805333495140076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,16,balanced,0.08590933680534363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,32,power_law_1.2,0.15773439407348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,16,balanced,0.08799466490745544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,16,balanced,0.12585600217183432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,32,power_law_1.2,0.1813696026802063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,16,balanced,0.12916800379753113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,16,balanced,0.20390933752059937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,16,balanced,0.13134400049845377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,32,power_law_1.2,0.19892480373382568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,16,balanced,0.20578666528066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,16,balanced,0.13247999548912048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,32,power_law_1.2,0.22154879570007324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,16,balanced,0.2051680088043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,16,balanced,0.13365866740544638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,16,balanced,0.20467199881871542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,16,balanced,0.13363200426101685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,16,balanced,0.20562666654586792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,32,power_law_1.2,0.25315840244293214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,16,balanced,0.13537066181500754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,16,balanced,0.20693333943684897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,16,balanced,0.13634133338928223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,16,balanced,0.20975999037424722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,16,balanced,0.13829333583513895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,16,balanced,0.21012266476949057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.2,0.2491391897201538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,16,balanced,0.04593066871166229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,16,balanced,0.14028799533843994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,16,balanced,0.21171732743581137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,32,power_law_1.2,0.315775990486145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,16,balanced,0.046997333566347756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,16,balanced,0.1469439963499705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,16,balanced,0.21688000361124674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.2,0.3975872039794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,16,balanced,0.05003733436266581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,16,balanced,0.14854400356610617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,16,balanced,0.21766932805379233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,16,balanced,0.06725866595904033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,16,balanced,0.15387200315793356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,16,balanced,0.2229386568069458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,32,power_law_1.2,0.5631487846374512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,16,balanced,0.09107733766237895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,16,balanced,0.12770133217175803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,16,balanced,0.16800532738367716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.2,0.6776768207550049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,16,balanced,0.23669866720835367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,16,balanced,0.129530668258667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,16,balanced,0.1786880095799764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,32,power_law_1.2,1.0029760360717774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,16,balanced,0.24876266717910767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,16,balanced,0.12959999839464822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,16,balanced,0.13131733735402426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.2,1.271622371673584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,16,balanced,0.20995734135309854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,16,balanced,0.2646933396657308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,16,balanced,0.13224533200263977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,16,balanced,0.13451199730237326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,16,balanced,0.23053866624832153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,32,power_law_1.2,2.165088081359863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,16,balanced,0.29075199365615845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,16,balanced,0.13437333703041077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,16,balanced,0.1372160017490387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.2,3.0788991928100584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,16,balanced,0.2727680007616679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,16,balanced,0.3142933249473572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,16,balanced,0.13962666193644205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,32,power_law_1.2,3.2046207427978515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,16,balanced,0.14563199877738953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,16,power_law_1.01,0.1313024044036865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,16,balanced,0.3302133282025655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,16,balanced,0.3754826784133911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,32,power_law_1.2,6.112774276733399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,16,power_law_1.01,0.0876800000667572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,16,balanced,0.1488533318042755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,16,power_law_1.01,0.21145598888397216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,16,balanced,0.15450132886568704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,16,power_law_1.01,0.1314303994178772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,16,power_law_1.01,0.08572160005569458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,32,power_law_1.2,13.863136291503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,16,power_law_1.01,0.0833407998085022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,16,balanced,0.41845866044362384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,16,power_law_1.01,0.0955839991569519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,16,balanced,0.44150932629903156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,16,power_law_1.01,0.07789440155029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,16,power_law_1.01,0.12291840314865113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,16,power_law_1.01,0.09111679792404175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,16,power_law_1.01,0.14687999486923217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,16,balanced,0.1718719998995463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,16,power_law_1.01,0.1019968032836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,16,power_law_1.01,0.17883520126342772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,16,balanced,0.5065546830495199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,16,power_law_1.01,0.111353600025177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,16,power_law_1.01,0.1801344037055969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,16,balanced,0.5020586649576823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,16,power_law_1.01,0.11631360054016113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,16,power_law_1.01,0.18238719701766967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,16,power_law_1.01,0.18605439662933348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,16,power_law_1.01,0.12095999717712402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,16,power_law_1.01,0.18968960046768188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,16,power_law_1.01,0.12205439805984497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,16,power_law_1.01,0.18815360069274903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,16,power_law_1.01,0.1266111969947815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,16,balanced,0.1888479987780253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,16,balanced,0.7190133730570475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,16,power_law_1.01,0.19692800045013428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,16,balanced,0.7006879647572836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,16,power_law_1.01,0.12784639596939087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,16,power_law_1.01,0.21128320693969727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,16,balanced,0.21369600296020508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,16,power_law_1.01,0.12780799865722656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,16,power_law_1.01,0.2235327959060669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,16,power_law_1.01,0.09427840113639832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,16,power_law_1.01,0.13954559564590455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,16,power_law_1.01,0.22670719623565674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,16,balanced,0.2320586641629537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,16,power_law_1.01,0.13178880214691163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,16,power_law_1.01,0.26715519428253176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,16,power_law_1.01,0.14706560373306274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,16,power_law_1.01,0.061536002159118655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,16,power_law_1.01,0.29741439819335935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,16,power_law_1.01,0.15587199926376344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,16,power_law_1.01,0.0750656008720398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,16,balanced,0.29891733328501385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,16,power_law_1.01,0.2900991916656494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,16,power_law_1.01,0.09071360230445862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,16,power_law_1.01,0.16206079721450806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,16,balanced,0.9189013640085856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,16,power_law_1.01,0.10371840000152588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,16,power_law_1.01,0.37594239711761473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,16,power_law_1.01,0.19048320055007933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,16,balanced,0.8921973705291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,16,power_law_1.01,0.11471999883651733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,16,balanced,0.3542773326237996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,16,power_law_1.01,0.20874240398406982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,16,power_law_1.01,0.39015679359436034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,16,power_law_1.01,0.11633280515670777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,16,power_law_1.01,0.12388479709625244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,16,power_law_1.01,0.24594559669494628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,16,power_law_1.01,0.4551680088043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,16,power_law_1.01,0.12182400226593018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,16,power_law_1.01,0.27808640003204343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,16,power_law_1.01,0.1317247986793518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,16,power_law_1.01,0.5396416187286377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,16,power_law_1.01,0.3445312023162842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,16,power_law_1.01,0.1357759952545166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,16,balanced,0.5303306579589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,16,power_law_1.01,0.7330111980438232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,16,power_law_1.01,0.14353280067443847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,16,power_law_1.01,0.4289408206939697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,16,power_law_1.01,0.1522879958152771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,16,power_law_1.01,0.8738431930541992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,16,power_law_1.01,0.6023359775543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,16,power_law_1.01,0.16698880195617677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,16,power_law_1.01,1.0710720062255858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,16,power_law_1.2,0.1307711958885193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,16,power_law_1.01,0.18125439882278443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,16,power_law_1.01,0.7575295925140381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,16,balanced,1.1528586546579997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,16,power_law_1.01,0.19392000436782836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,16,balanced,0.6314239899317423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,16,power_law_1.01,1.6221439361572265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,16,power_law_1.2,0.21067519187927247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,16,balanced,1.0967573324839275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,16,power_law_1.01,1.089395236968994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,16,power_law_1.2,0.07466880083084107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,16,power_law_1.01,1.9589759826660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,16,power_law_1.01,1.3271231651306152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,16,power_law_1.01,0.23847041130065919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,16,power_law_1.2,0.09672319889068604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,16,power_law_1.01,3.3838462829589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,16,power_law_1.2,0.10407040119171143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,16,power_law_1.01,1.6657279968261718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,16,power_law_1.2,0.13763200044631957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,16,power_law_1.01,0.23671040534973145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,16,power_law_1.01,2.5945152282714843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,16,power_law_1.2,0.16695040464401245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,16,power_law_1.01,5.901094436645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,16,balanced,0.917850653330485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,16,power_law_1.01,0.2831104040145874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,16,power_law_1.2,0.16822400093078613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,16,power_law_1.01,0.3409663915634155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,16,power_law_1.01,4.713459014892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,16,power_law_1.2,0.17498879432678222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,16,power_law_1.01,0.4635647773742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,16,power_law_1.01,0.5735231876373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,16,power_law_1.2,0.18240640163421631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,16,power_law_1.01,0.7639872074127197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,16,power_law_1.2,0.18140799999237062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,16,power_law_1.01,0.9656767845153809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,16,power_law_1.2,0.189683198928833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,16,power_law_1.01,1.4690879821777343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,16,power_law_1.2,0.19820159673690796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,16,balanced,1.7765119870503743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,16,power_law_1.01,2.082054328918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,16,balanced,1.2035146554311116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,16,power_law_1.2,0.2160128116607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,16,power_law_1.01,2.5394880294799806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,16,balanced,1.703711986541748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,16,power_law_1.2,0.23024001121520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,16,power_law_1.01,3.9258880615234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,16,power_law_1.2,0.24276480674743653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,16,power_law_1.01,8.336946868896485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,16,power_law_1.2,0.2810944080352783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,16,power_law_1.2,0.3092031955718994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,16,power_law_1.2,0.30395519733428955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,16,power_law_1.2,0.3971712112426758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,16,power_law_1.2,0.4544511795043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,16,balanced,1.4950559933980305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,16,power_law_1.2,0.4941567897796631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,16,power_law_1.2,0.6468287944793701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,16,power_law_1.2,0.8464703559875488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,16,power_law_1.2,0.9579071998596191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,16,power_law_1.2,1.3517631530761718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,16,power_law_1.2,2.1211328506469727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,16,power_law_1.2,2.6899200439453126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,16,power_law_1.2,4.147955322265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,16,power_law_1.2,8.352108764648438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,16,balanced,2.364975929260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,16,balanced,3.510949452718099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,16,balanced,3.3550186157226562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,16,power_law_1.2,0.0833791971206665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,16,power_law_1.2,0.1281280040740967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,16,power_law_1.2,0.06083199977874756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,16,power_law_1.2,0.07192959785461425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,16,power_law_1.2,0.08698880076408386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,16,power_law_1.2,0.09742720127105713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,16,power_law_1.2,0.11441919803619385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,16,power_law_1.2,0.12132480144500732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,16,power_law_1.2,0.12095359563827515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,16,balanced,4.698618570963542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,16,power_law_1.2,0.1180799961090088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,16,power_law_1.2,0.1193727970123291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,16,power_law_1.2,0.12247680425643921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,16,power_law_1.2,0.13890559673309327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,16,power_law_1.2,0.14456959962844848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,16,power_law_1.2,0.1572160005569458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,16,power_law_1.2,0.16250879764556886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,16,power_law_1.2,0.16776319742202758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,16,power_law_1.2,0.20242559909820557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,16,power_law_1.2,0.21646718978881835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,16,power_law_1.2,0.2784895896911621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,16,power_law_1.2,0.2919167995452881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,16,power_law_1.2,0.3991296052932739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,16,power_law_1.2,0.5158336162567139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,16,power_law_1.2,0.6283648014068604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,16,power_law_1.2,0.8606847763061524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,16,power_law_1.2,1.353990364074707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,16,power_law_1.2,1.5273856163024901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,16,power_law_1.2,1.8967424392700196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,16,power_law_1.2,0.09399679899215699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,16,power_law_1.2,3.2297599792480467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,16,power_law_1.2,0.11070079803466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,8,balanced,0.05574933191140493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,16,power_law_1.2,0.058297598361968996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,8,balanced,0.05968533456325531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,16,power_law_1.2,7.636908721923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,16,power_law_1.2,0.07007359862327575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,8,balanced,0.06356266637643178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,16,power_law_1.2,0.0868224024772644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,8,balanced,0.08724266290664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,8,balanced,0.12660266955693564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,16,power_law_1.2,0.09093120098114013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,8,balanced,0.2030506730079651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,16,power_law_1.2,0.1141055941581726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,8,balanced,0.210591991742452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,16,power_law_1.2,0.12072960138320923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,8,balanced,0.20710400740305582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,16,power_law_1.2,0.12398079633712769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,8,balanced,0.20851733287175497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,8,balanced,0.048063998421033226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,8,balanced,0.2095573345820109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,16,power_law_1.2,0.12867200374603271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,8,balanced,0.21067732572555542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,16,power_law_1.2,0.13308160305023192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,8,balanced,0.05320533116658529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,8,balanced,0.21247466405232748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,8,balanced,0.05276266733805338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,16,power_law_1.2,0.14573440551757813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,8,balanced,0.21523733933766684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,8,balanced,0.07306133210659027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,16,power_law_1.2,0.14606080055236817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,8,balanced,0.21677867571512857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,8,balanced,0.09114666779836018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,16,power_law_1.2,0.15828479528427125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,8,balanced,0.13361600041389465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,8,balanced,0.22105065981547037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,16,power_law_1.2,0.1739456057548523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,8,balanced,0.13487999637921652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,8,balanced,0.2238933245340983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,16,power_law_1.2,0.19196159839630128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,8,balanced,0.13648533821105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,8,balanced,0.22842667500178018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,16,power_law_1.2,0.20945920944213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,8,balanced,0.13731200496355692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,8,balanced,0.13769066333770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,8,balanced,0.24743467569351196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,8,balanced,0.13929067055384317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,8,balanced,0.25776533285776776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,16,power_law_1.2,0.2408895969390869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,8,balanced,0.14172266920407614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,8,balanced,0.14306132992108664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,8,balanced,0.2983306646347046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,8,balanced,0.14597866932551065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,16,power_law_1.2,0.2565119981765747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,8,balanced,0.30875200033187866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,8,balanced,0.15371200442314148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,16,power_law_1.2,0.32099199295043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,8,balanced,0.157231996456782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,16,power_law_1.2,0.3771712064743042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,8,balanced,0.34851733843485516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,8,balanced,0.1618933379650116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,16,power_law_1.2,0.5564288139343262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,8,balanced,0.1779306729634603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,16,power_law_1.2,0.6642816066741943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,8,balanced,0.40824000040690106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,8,balanced,0.19780266284942627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,16,power_law_1.2,1.0207488059997558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,8,balanced,0.048165331284205117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,8,power_law_1.01,0.08650879859924317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,8,power_law_1.01,0.06483839750289917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,16,power_law_1.2,1.406495952606201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,8,balanced,0.22712000211079916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,8,balanced,0.05082133412361145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,8,power_law_1.01,0.12051199674606324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,8,balanced,0.05586666862169901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,16,power_law_1.2,1.8968191146850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,8,power_law_1.01,0.08297600150108338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,8,balanced,0.5030826727549235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,8,power_law_1.01,0.07786880135536194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,8,balanced,0.2547360062599182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,8,balanced,0.07197866837183635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,8,power_law_1.01,0.09049599766731262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,8,power_law_1.01,0.06367999911308289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,8,power_law_1.01,0.11664639711380005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,16,power_law_1.2,2.7858367919921876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,8,balanced,0.09403199950853984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,8,power_law_1.01,0.13043199777603148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,8,power_law_1.01,0.06769279837608337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,8,balanced,0.1367039978504181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,8,balanced,0.30459733804066974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,16,power_law_1.2,3.1532608032226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,8,power_law_1.01,0.17008639574050904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,8,power_law_1.01,0.08451200127601624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,8,balanced,0.13878400127092996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,8,power_law_1.01,0.17363200187683106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,8,balanced,0.5862453381220499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,8,power_law_1.01,0.09674879908561707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,8,balanced,0.13987200458844504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,8,power_law_1.01,0.18855040073394774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,16,power_law_1.2,4.705465698242188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,8,balanced,0.37210134665171307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,8,power_law_1.01,0.1695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,8,balanced,0.14167466759681702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,8,power_law_1.01,0.11329920291900634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,8,power_law_1.01,0.19459199905395508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,8,balanced,0.14172266920407614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,8,power_law_1.01,0.11577600240707397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,16,power_law_1.2,11.661408233642579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,8,power_law_1.01,0.19103360176086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,8,balanced,0.14553067088127136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,8,power_law_1.01,0.11902079582214356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,8,power_law_1.01,0.19839999675750733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,8,balanced,0.48503466447194415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,8,power_law_1.01,0.20972158908843994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,8,balanced,0.14621333281199136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,8,power_law_1.01,0.12474240064620971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,8,power_law_1.01,0.22551679611206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,8,balanced,0.14972266554832458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,8,balanced,0.8125226497650146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,8,power_law_1.01,0.12370560169219971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,8,power_law_1.01,0.23503999710083007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,8,power_law_1.01,0.24303359985351564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,8,balanced,0.15292267004648843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,8,power_law_1.01,0.13308160305023192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,8,power_law_1.01,0.2871551990509033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,8,power_law_1.01,0.1345088005065918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,8,balanced,0.16173866391181946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,8,power_law_1.01,0.29738240242004393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,8,balanced,0.5902933279673258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,8,power_law_1.01,0.13557759523391724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,8,balanced,0.16523200273513794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,8,power_law_1.01,0.37519359588623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,8,power_law_1.01,0.3568128108978271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,8,power_law_1.01,0.15456000566482545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,8,balanced,0.1735466718673706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,8,power_law_1.01,0.4560256004333496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,8,power_law_1.01,0.15504000186920167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,8,power_law_1.01,0.5209472179412842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,8,power_law_1.01,0.16946560144424438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,8,power_law_1.01,0.6893375873565674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,8,balanced,1.048847993214925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,8,power_law_1.01,0.8542207717895508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,8,power_law_1.01,0.196396803855896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,8,balanced,0.8424800237019857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,8,power_law_1.01,1.1614015579223633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,8,balanced,0.19769599040349325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,8,power_law_1.01,0.21210238933563233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,8,power_law_1.01,1.5397503852844239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,8,power_law_1.01,0.2575808048248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,8,power_law_1.01,1.9043840408325194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,8,power_law_1.01,0.30915839672088624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,8,power_law_1.01,3.0974912643432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,8,power_law_1.01,0.3745728015899658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,8,power_law_1.01,0.0748416006565094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,8,power_law_1.01,0.46611199378967283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,8,power_law_1.01,6.62265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,8,power_law_1.01,0.6042304039001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,8,power_law_1.01,0.09452160000801087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,8,balanced,0.22387200593948364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,8,balanced,1.0770186583201091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,8,power_law_1.01,0.7686399936676025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,8,power_law_1.01,0.07182080149650574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,8,balanced,1.3250133196512859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,8,power_law_1.01,1.0785216331481933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,8,power_law_1.01,0.07468159794807434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,8,balanced,0.2678613265355428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,8,power_law_1.01,1.4918208122253418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,8,power_law_1.01,0.08164479732513427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,8,balanced,0.30357333024342853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,8,power_law_1.01,0.09775360226631165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,8,power_law_1.01,1.7827327728271485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,8,power_law_1.01,0.11681920289993286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,8,power_law_1.01,2.6246335983276365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,8,balanced,0.4150079886118571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,8,power_law_1.01,0.11971839666366577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,8,power_law_1.01,0.12783360481262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,8,power_law_1.01,5.323571014404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,8,balanced,0.4894133408864339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,8,balanced,1.3707359631856282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,8,power_law_1.01,0.12970880270004273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,8,power_law_1.01,0.13603199720382692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,8,power_law_1.01,0.14881279468536376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,8,balanced,0.7234986623128256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,8,power_law_1.01,0.14853760004043579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,8,power_law_1.01,0.16201599836349487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,8,balanced,2.023359934488932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,8,power_law_1.01,0.16870399713516235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,8,power_law_1.01,0.19397120475769042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,8,balanced,0.8787573178609213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,8,power_law_1.01,0.21253759860992433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,8,power_law_1.01,0.2571455955505371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,8,balanced,2.0860692660013833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,8,balanced,1.2883093357086182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,8,power_law_1.01,0.2631999969482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,8,power_law_1.2,0.08621439933776856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,8,power_law_1.01,0.36449921131134033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,8,power_law_1.2,0.11051520109176635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,8,power_law_1.01,0.4264768123626709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,8,power_law_1.01,0.5616447925567627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,8,power_law_1.2,0.06588159799575806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,8,power_law_1.01,0.7164159774780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,8,power_law_1.2,0.08109440207481385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,8,power_law_1.01,0.9716863632202148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,8,balanced,1.70252259572347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,8,power_law_1.2,0.11043200492858887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,8,power_law_1.01,1.2185024261474608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,8,power_law_1.2,0.1198591947555542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,8,power_law_1.01,1.7927488327026366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,8,power_law_1.2,0.18105599880218506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,8,power_law_1.01,2.4550975799560546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,8,power_law_1.2,0.1622912049293518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,8,power_law_1.2,0.1683776021003723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,8,power_law_1.01,2.995942306518555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,8,power_law_1.2,0.1712448000907898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,8,power_law_1.01,4.6694591522216795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,8,power_law_1.2,0.18636800050735475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,8,power_law_1.2,0.19063680171966552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,8,balanced,2.1230079332987466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,8,power_law_1.01,10.466425323486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,8,power_law_1.2,0.20779519081115722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,8,balanced,4.008458773295085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,8,power_law_1.2,0.21052160263061523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,8,power_law_1.2,0.2261568069458008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,8,power_law_1.2,0.22702720165252685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,8,power_law_1.2,0.274399995803833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,8,power_law_1.2,0.30678400993347166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,8,power_law_1.2,0.3084415912628174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,8,balanced,4.134197235107422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,8,power_law_1.2,0.3899199962615967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,8,power_law_1.2,0.42118401527404786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,8,power_law_1.2,0.5165376186370849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,8,power_law_1.2,0.6094528198242187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,8,balanced,3.3695732752482095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,8,power_law_1.2,0.8077695846557618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,8,power_law_1.2,0.9883135795593262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,8,power_law_1.2,1.3196415901184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,8,power_law_1.2,1.5502464294433593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,8,power_law_1.2,2.333286476135254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,8,power_law_1.2,3.73070068359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,8,power_law_1.2,0.06490240097045899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,8,power_law_1.2,0.0800383985042572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,8,power_law_1.2,7.315577697753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,8,power_law_1.2,0.05368959903717041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,8,power_law_1.2,0.06386560201644897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,8,power_law_1.2,0.0780672013759613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,8,power_law_1.2,0.09007999897003174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,8,power_law_1.2,0.11151360273361206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,8,power_law_1.2,0.12040319442749023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,8,power_law_1.2,0.1178879976272583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,8,power_law_1.2,0.12086399793624877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,8,power_law_1.2,0.12578560113906861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,8,power_law_1.2,0.1324671983718872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,8,power_law_1.2,0.14044159650802612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,8,power_law_1.2,0.1474560022354126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,8,power_law_1.2,0.1500607967376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,8,balanced,6.718629201253255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,8,power_law_1.2,0.15865600109100342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,8,power_law_1.2,0.07445120215415954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,8,power_law_1.2,0.17491840124130248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,8,power_law_1.2,0.08979840278625488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,8,power_law_1.2,0.2154560089111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,8,power_law_1.2,0.05909759998321533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,8,power_law_1.2,0.07468799948692321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,8,power_law_1.2,0.22081279754638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,8,power_law_1.2,0.08556159734725952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,4,balanced,0.05628266433874766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,8,power_law_1.2,0.27946879863739016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,8,power_law_1.2,0.09932799935340882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,4,balanced,0.05857066810131073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,8,power_law_1.2,0.11978880167007447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,8,power_law_1.2,0.3162496089935303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,8,power_law_1.2,0.12563199996948243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,4,balanced,0.06758933266003926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,8,power_law_1.2,0.4046016216278076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,8,power_law_1.2,0.12305920124053955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,4,balanced,0.08940266569455464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,8,power_law_1.2,0.1294592022895813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,8,power_law_1.2,0.4949632167816162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,8,power_law_1.2,0.13824000358581542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,4,balanced,0.1348960002263387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,8,power_law_1.2,0.1547968029975891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,8,power_law_1.2,0.6151936054229736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,4,balanced,0.21010132630666098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,8,power_law_1.2,0.15678720474243163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,4,balanced,0.21134400367736816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,8,power_law_1.2,0.16412800550460815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,8,power_law_1.2,0.8525055885314942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,8,power_law_1.2,0.18343679904937743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,4,balanced,0.2109066645304362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,8,power_law_1.2,1.2519935607910155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,8,power_law_1.2,0.20213119983673095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,4,balanced,0.21368000904719034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,4,balanced,0.21409066518147787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,8,power_law_1.2,0.21546239852905275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,8,power_law_1.2,1.6236799240112305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,4,balanced,0.2176426649093628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,8,power_law_1.2,1.8597824096679687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,4,balanced,0.2213546633720398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,8,power_law_1.2,0.26165759563446045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,4,balanced,0.22348799308141074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,8,power_law_1.2,2.957151985168457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,4,balanced,0.2278133432070414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,4,balanced,0.23282132546106973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,8,power_law_1.2,0.2831360101699829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,8,power_law_1.2,7.198649597167969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,8,power_law_1.2,0.3762943983078003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,4,balanced,0.23576533794403076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,8,power_law_1.2,0.47171840667724607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,4,balanced,0.24514667193094888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,8,power_law_1.2,0.6246335983276368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,4,balanced,0.26682132482528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,8,power_law_1.2,0.8180031776428223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,8,power_law_1.2,1.052678394317627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,4,balanced,0.295087993144989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,8,power_law_1.2,1.663916778564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,4,balanced,0.331712007522583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,8,power_law_1.2,2.1979391098022463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,8,power_law_1.2,2.464851188659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,4,balanced,0.3633333444595337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,8,power_law_1.2,3.8377025604248045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,4,balanced,0.421183983484904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,8,power_law_1.2,6.166041564941406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,4,balanced,0.4978026549021403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,8,power_law_1.2,12.534374237060547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,4,balanced,0.6457440058390299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,4,balanced,0.04907733201980591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,4,balanced,0.7780693372090658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,4,balanced,0.051125332713127136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,4,balanced,0.05516799787680308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,4,balanced,0.07213333249092102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,4,balanced,0.0974026620388031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,4,balanced,0.14626666903495789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,4,balanced,0.14948266744613647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,4,balanced,1.091429313023885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,4,balanced,0.1513653298219045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,4,balanced,0.15172800421714783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,4,power_law_1.01,0.06532480120658875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,4,balanced,0.1529706617196401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,4,balanced,0.05825066566467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,4,power_law_1.01,0.08157439827919007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,4,balanced,0.15543466806411743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,4,balanced,0.06319466729958852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,4,power_law_1.01,0.06960639953613282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,4,balanced,0.15968533356984457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,4,balanced,0.06769600013891856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,4,power_law_1.01,0.08210560083389282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,4,balanced,0.16286933422088623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,4,balanced,0.08556266625722249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,4,power_law_1.01,0.11233919858932495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,4,balanced,1.386954625447591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,4,balanced,0.1670186718304952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,4,balanced,0.11050666371981303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,4,power_law_1.01,0.13191039562225343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,4,balanced,0.17460266749064127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,4,balanced,0.16084800163904825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,4,power_law_1.01,0.16637439727783204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,4,balanced,0.1787466605504354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,4,balanced,0.164383997519811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,4,power_law_1.01,0.16989439725875854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,4,balanced,0.18686399857203165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,4,balanced,0.16538133223851523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,4,power_law_1.01,0.17766400575637817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,4,balanced,0.1676106651624044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,4,balanced,0.20664000511169434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,4,power_law_1.01,0.18257280588150024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,4,balanced,0.17060800393422446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,4,balanced,0.23506667216618857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,4,balanced,0.17347200711568198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,4,power_law_1.01,0.1894592046737671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,4,balanced,0.2760053277015686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,4,balanced,0.17674134174982706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,4,power_law_1.01,0.20261759757995607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,4,balanced,1.8428746859232585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,4,power_law_1.01,0.054054397344589236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,4,balanced,0.18131732940673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,4,power_law_1.01,0.2168639898300171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,4,balanced,0.30237332979838055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,4,power_law_1.01,0.06592640280723572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,4,balanced,0.1881386637687683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,4,power_law_1.01,0.22367360591888427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,4,power_law_1.01,0.05607039928436279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,4,balanced,0.20288532972335815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,4,power_law_1.01,0.24670720100402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,4,balanced,0.3722879886627197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,4,power_law_1.01,0.06435840129852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,4,balanced,0.20719999074935913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,4,power_law_1.01,0.2580672025680542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,4,power_law_1.01,0.08263040184974671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,4,power_law_1.01,0.24909439086914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,4,balanced,0.21884800990422568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,4,balanced,0.46135465304056805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,4,power_law_1.01,0.09667199850082397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,4,power_law_1.01,0.3219199895858765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,4,power_law_1.01,0.1218559980392456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,4,power_law_1.01,0.3464384078979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,4,power_law_1.01,0.1255295991897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,4,power_law_1.01,0.401580810546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,4,balanced,0.6244213183720907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,4,power_law_1.01,0.1266111969947815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,4,balanced,0.2560906608899434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,4,power_law_1.01,0.41210241317749025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,4,power_law_1.01,0.12819199562072753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,4,power_law_1.01,0.49570560455322266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,4,power_law_1.01,0.13963520526885986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,4,power_law_1.01,0.6082560062408447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,4,balanced,2.665701389312744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,4,power_law_1.01,0.14067840576171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,4,balanced,0.7857973575592041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,4,power_law_1.01,0.7969215869903564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,4,power_law_1.01,0.1520640015602112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,4,power_law_1.01,0.9261887550354004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,4,balanced,0.32339733839035034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,4,power_law_1.01,0.16027519702911378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,4,power_law_1.01,1.3354175567626954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,4,power_law_1.01,0.0704576015472412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,4,power_law_1.01,0.1694208025932312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,4,balanced,0.41119468212127686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,4,power_law_1.01,0.18164479732513428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,4,power_law_1.01,1.6372671127319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,4,power_law_1.01,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,4,power_law_1.01,0.07015680074691773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,4,power_law_1.01,0.19094400405883788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,4,balanced,0.456986665725708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,4,power_law_1.01,2.2045568466186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,4,power_law_1.01,0.08401920199394226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,4,balanced,1.1557119687398274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,4,power_law_1.01,0.2172032117843628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,4,power_law_1.01,0.09594240188598632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,4,power_law_1.01,0.25148160457611085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,4,power_law_1.01,3.185049629211426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,4,power_law_1.01,0.11612160205841064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,4,balanced,0.6418293317159017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,4,power_law_1.01,0.13582719564437867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,4,power_law_1.01,0.3009471893310547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,4,power_law_1.01,0.14156800508499146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,4,power_law_1.01,6.443174743652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,4,power_law_1.01,0.35330560207366946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,4,power_law_1.01,0.14885120391845702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,4,power_law_1.01,0.4235583782196045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,4,balanced,0.7649813493092855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,4,power_law_1.01,0.15371520519256593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,4,power_law_1.01,0.5295743942260742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,4,power_law_1.01,0.16388479471206666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,4,power_law_1.01,0.17619839906692505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,4,power_law_1.01,0.7291840076446533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,4,balanced,1.4184640248616536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,4,power_law_1.01,0.1829375982284546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,4,power_law_1.01,0.20034561157226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,4,balanced,1.171008030573527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,4,power_law_1.01,0.932044792175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,4,power_law_1.01,0.22213120460510255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,4,power_law_1.01,0.23939199447631837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,4,power_law_1.01,1.2631808280944825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,4,power_law_1.01,0.26447999477386475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,4,power_law_1.01,1.6624191284179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,4,balanced,1.442197322845459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,4,power_law_1.01,0.3326783895492554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,4,power_law_1.01,2.1271551132202147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,4,power_law_1.01,0.3791232109069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,4,balanced,1.8395840326944988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,4,power_law_1.01,3.2503616333007814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,4,power_law_1.01,0.4875967979431152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,4,power_law_1.2,0.06602879762649536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,4,power_law_1.01,0.5678207874298096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,4,balanced,2.098031997680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,4,balanced,5.2697493235270185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,4,power_law_1.01,6.6525123596191404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,4,power_law_1.01,0.798086404800415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,4,power_law_1.2,0.07995520234107971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,4,power_law_1.01,1.004678440093994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,4,power_law_1.2,0.0642687976360321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,4,power_law_1.01,1.4286527633666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,4,power_law_1.01,1.6878080368041992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,4,power_law_1.2,0.08565760254859925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,4,power_law_1.01,2.629439926147461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,4,power_law_1.2,0.09638400077819824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,4,power_law_1.01,3.3180862426757813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,4,power_law_1.2,0.12244479656219483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,4,power_law_1.2,0.05428479909896851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,4,power_law_1.01,4.401574325561524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,4,power_law_1.2,0.16278400421142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,4,power_law_1.2,0.06586880087852479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,4,balanced,2.7484747568766275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,4,power_law_1.01,6.596991729736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,4,power_law_1.2,0.1716928005218506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,4,power_law_1.2,0.056627202033996585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,4,power_law_1.2,0.17834240198135376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,4,power_law_1.2,0.06901119947433472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,4,power_law_1.01,12.974137878417968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,4,power_law_1.2,0.18266240358352662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,4,balanced,2.7616745630900064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,4,power_law_1.2,0.07927039861679078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,4,power_law_1.2,0.1955456018447876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,4,power_law_1.2,0.09461119771003723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,4,power_law_1.2,0.1985856056213379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,4,power_law_1.2,0.11940480470657348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,4,power_law_1.2,0.21528959274291992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,4,power_law_1.2,0.1205888032913208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,4,power_law_1.2,0.2275264024734497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,4,balanced,3.4213279088338218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,4,power_law_1.2,0.253606390953064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,4,power_law_1.2,0.12414720058441162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,4,power_law_1.2,0.26689920425415037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,4,power_law_1.2,0.12602239847183228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,4,power_law_1.2,0.13746559619903564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,4,power_law_1.2,0.3033663988113403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,4,power_law_1.2,0.14810880422592163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,4,power_law_1.2,0.3315840005874634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,4,power_law_1.2,0.35323519706726075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,4,power_law_1.2,0.14953600168228148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,4,power_law_1.2,0.40414719581604003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,4,power_law_1.2,0.16346240043640137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,4,power_law_1.2,0.423737621307373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,4,power_law_1.2,0.17637120485305785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,4,power_law_1.2,0.543833589553833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,4,power_law_1.2,0.18494720458984376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,4,power_law_1.2,0.657862377166748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,4,power_law_1.2,0.19768960475921632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,4,power_law_1.2,0.8515392303466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,4,power_law_1.2,0.22953600883483888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,4,power_law_1.2,1.007756805419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,4,power_law_1.2,0.2587007999420166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,4,balanced,5.433045069376628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,4,power_law_1.2,0.3368832111358643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,4,power_law_1.2,1.3670720100402831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,4,power_law_1.2,0.36438400745391847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,4,power_law_1.2,1.8464576721191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,4,power_law_1.2,0.4526336193084717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,4,power_law_1.2,2.2480255126953126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,4,power_law_1.2,0.5632256031036377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,4,power_law_1.2,3.9167102813720702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,4,power_law_1.2,0.7699391841888428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,4,balanced,5.448346455891927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,4,power_law_1.2,1.0059328079223633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,4,power_law_1.2,7.6742401123046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,4,power_law_1.2,1.449350357055664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,4,power_law_1.2,1.9394176483154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,4,power_law_1.2,2.2840703964233398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,4,power_law_1.2,3.4738433837890623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,4,power_law_1.2,7.29583969116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,4,balanced,10.78427759806315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,4,power_law_1.2,0.07056639790534973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,4,power_law_1.2,0.08343039751052857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,4,power_law_1.2,0.06803200244903565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,4,power_law_1.2,0.08323839902877808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,4,power_law_1.2,0.09820799827575684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,4,power_law_1.2,0.1106112003326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,4,power_law_1.2,0.13484159708023072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,4,power_law_1.2,0.1414720058441162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,4,power_law_1.2,0.1458624005317688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,4,power_law_1.2,0.15267200469970704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,4,power_law_1.2,0.16344319581985473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,4,power_law_1.2,0.17253119945526124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,4,power_law_1.2,0.18891520500183107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,4,power_law_1.2,0.2093440055847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,4,power_law_1.2,0.22183680534362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,4,power_law_1.2,0.2427839994430542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,4,power_law_1.2,0.274835205078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,2,balanced,0.058261334896087646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,2,balanced,0.051728000243504844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,2,balanced,0.061674664417902626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,2,balanced,0.05472533404827118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,2,balanced,0.07144533097743988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,2,balanced,0.060736000537872314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,4,power_law_1.2,0.3486527919769287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,2,balanced,0.09675733248392741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,2,balanced,0.08194666604201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,2,balanced,0.14748266339302063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,2,balanced,0.11717866857846577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,4,power_law_1.2,0.3767807960510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,2,balanced,0.2391306757926941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,2,balanced,0.1788640022277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,2,balanced,0.2413333257039388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,4,power_law_1.2,0.48636159896850584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,2,balanced,0.1800533334414164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,2,balanced,0.24410132567087808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,2,balanced,0.18128534158070883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,4,power_law_1.2,0.6257408142089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,2,balanced,0.2460213303565979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,2,balanced,0.18463999032974243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,4,power_law_1.2,0.8453760147094727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,2,balanced,0.2499786615371704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,2,balanced,0.1851573387781779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,4,power_law_1.2,1.0080896377563477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,2,balanced,0.18784000476201376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,2,balanced,0.25410666068394977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,4,power_law_1.2,1.4669504165649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,2,balanced,0.19192532698313394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,2,balanced,0.26014933983484906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,2,balanced,0.080335999528567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,2,balanced,0.19437867403030396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,4,power_law_1.2,1.9469375610351562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,2,balanced,0.2629706660906474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,2,balanced,0.08523733417193095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,2,balanced,0.25327465931574505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,2,balanced,0.198362668355306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,4,power_law_1.2,2.8116031646728517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,2,balanced,0.09244799613952637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,2,balanced,0.20916267236073813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,2,balanced,0.2608746687571208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,4,power_law_1.2,4.06864013671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,2,balanced,0.11265599727630615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,2,balanced,0.21406400203704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,2,balanced,0.26572267214457196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,2,balanced,0.14324800173441568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,4,power_law_1.2,4.6539966583251955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,2,balanced,0.27539199590682983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,2,balanced,0.22924800713857016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,2,balanced,0.21450134118398032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,2,balanced,0.21922133366266885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,2,balanced,0.31010133028030396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,4,power_law_1.2,7.625273895263672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,2,balanced,0.26363199949264526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,2,balanced,0.2228906750679016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,2,balanced,0.3535733222961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,2,balanced,0.22609599431355795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,2,balanced,0.30477867523829144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,2,balanced,0.2307680050532023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,4,power_law_1.2,15.111846923828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,2,balanced,0.40514667828877765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,2,balanced,0.35016000270843506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,2,balanced,0.23753066857655844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,2,balanced,0.24368532498677573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,2,balanced,0.39772268136342365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,2,balanced,0.43966400623321533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,2,balanced,0.25126399596532184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,2,balanced,0.2648319999376933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,2,balanced,0.5187893311182658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,2,balanced,0.5581173499425253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,2,balanced,0.2834346691767375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,2,balanced,0.2959413329760234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,2,balanced,0.6490773359934489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,2,balanced,0.678272008895874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,2,balanced,0.3187733292579651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,2,balanced,0.9288372993469238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,2,balanced,0.9529066880544027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,2,balanced,0.41067731380462646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,2,balanced,1.1916853586832683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,2,balanced,1.1932106812795003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,2,power_law_1.01,0.058931201696395874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,2,power_law_1.01,0.052160000801086424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,2,power_law_1.01,0.06878079771995545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,2,power_law_1.01,0.05870720148086548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,2,balanced,0.5224426587422689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,2,power_law_1.01,0.06628479957580566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,2,power_law_1.01,0.0584447979927063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,2,balanced,0.6595253149668375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,2,power_law_1.01,0.08169599771499633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,2,power_law_1.01,0.07125759720802308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,2,balanced,1.7336053848266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,2,power_law_1.01,0.10849920511245728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,2,power_law_1.01,0.09280639886856079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,2,balanced,1.7221280733744304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,2,balanced,0.7439733346303304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,2,power_law_1.01,0.13803520202636718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,2,power_law_1.01,0.11071360111236572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,2,power_law_1.01,0.18068480491638184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,2,power_law_1.01,0.14005119800567628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,2,balanced,1.0797866980234783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,2,power_law_1.01,0.19527039527893067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,2,power_law_1.01,0.08158079981803894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,2,power_law_1.01,0.14693119525909423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,2,power_law_1.01,0.19536639451980592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,2,power_law_1.01,0.08780159950256347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,2,power_law_1.01,0.14984960556030275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,2,balanced,1.297871987024943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,2,power_law_1.01,0.20055680274963378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,2,power_law_1.01,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,2,power_law_1.01,0.15667840242385864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,2,power_law_1.01,0.21575679779052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,2,balanced,2.125429312388102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,2,power_law_1.2,0.05857920050621033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,2,power_law_1.01,0.10954879522323609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,2,power_law_1.01,0.16446720361709594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,2,balanced,2.1310027440389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,2,power_law_1.01,0.23155839443206788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,2,power_law_1.2,0.06680960059165955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,2,power_law_1.01,0.12193919420242309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,2,power_law_1.01,0.1749824047088623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,2,balanced,2.0058773358662925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,2,power_law_1.01,0.23885440826416016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,2,power_law_1.2,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,2,power_law_1.01,0.14258559942245483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,2,power_law_1.01,0.18390400409698487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,2,power_law_1.01,0.2383552074432373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,2,power_law_1.2,0.07890560030937195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,2,power_law_1.01,0.17582080364227295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,2,power_law_1.01,0.25328640937805175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,2,power_law_1.01,0.1998271942138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,2,power_law_1.2,0.10580480098724365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,2,power_law_1.01,0.19186559915542603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,2,power_law_1.01,0.27956480979919435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,2,power_law_1.01,0.21578879356384278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,2,balanced,2.484048048655192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,2,power_law_1.2,0.12949759960174562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,2,power_law_1.01,0.20205440521240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,2,power_law_1.01,0.28475520610809324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,2,power_law_1.01,0.23379199504852294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,2,power_law_1.2,0.1753600001335144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,2,power_law_1.01,0.20239999294281005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,2,power_law_1.01,0.36669440269470216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,2,power_law_1.01,0.24527359008789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,2,power_law_1.01,0.21960320472717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,2,power_law_1.2,0.18866560459136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,2,balanced,2.811024030049642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,2,power_law_1.01,0.4107071876525879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,2,power_law_1.01,0.28124160766601564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,2,balanced,2.8133440017700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,2,power_law_1.01,0.23249919414520265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,2,power_law_1.2,0.19822720289230347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,2,power_law_1.01,0.48618879318237307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,2,power_law_1.01,0.3140736103057861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,2,power_law_1.01,0.2405247926712036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,2,power_law_1.2,0.20794239044189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,2,power_law_1.01,0.5511871814727783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,2,power_law_1.01,0.37061760425567625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,2,balanced,3.673551877339681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,2,power_law_1.2,0.22055680751800538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,2,power_law_1.01,0.27151999473571775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,2,power_law_1.01,0.680940818786621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,2,power_law_1.01,0.46515841484069825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,2,power_law_1.01,0.29268479347229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,2,power_law_1.2,0.2321471929550171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,2,power_law_1.01,0.770911979675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,2,power_law_1.01,0.58122239112854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,2,power_law_1.01,0.3240895986557007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,2,power_law_1.2,0.2407615900039673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,2,power_law_1.01,1.0564096450805665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,2,power_law_1.01,0.6960319995880127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,2,power_law_1.01,0.38098559379577634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,2,power_law_1.2,0.23834240436553955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,2,power_law_1.01,1.308255958557129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,2,power_law_1.2,0.2746623992919922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,2,power_law_1.01,0.9743616104125976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,2,power_law_1.01,1.798700714111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,2,power_law_1.2,0.31011199951171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,2,power_law_1.01,1.2759936332702637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,2,power_law_1.01,0.49729280471801757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,2,power_law_1.01,2.3318975448608397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,2,power_law_1.2,0.31578240394592283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,2,balanced,4.857338587443034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,2,power_law_1.01,1.7657535552978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,2,power_law_1.2,0.3771775960922241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,2,power_law_1.01,2.8347135543823243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,2,power_law_1.01,2.250163269042969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,2,power_law_1.01,0.5467711925506592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,2,power_law_1.2,0.4114880084991455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,2,power_law_1.01,4.300262451171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,2,power_law_1.2,0.5008704185485839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,2,power_law_1.01,0.7168511867523193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,2,power_law_1.01,2.8291904449462892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,2,balanced,4.1531680425008135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,2,balanced,4.091738700866699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,2,power_law_1.2,0.5794367790222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,2,power_law_1.01,0.8670783996582031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,2,power_law_1.01,9.832876586914063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,2,power_law_1.01,4.593056106567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,2,power_law_1.2,0.6746496200561524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,2,power_law_1.01,1.175327968597412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,2,power_law_1.2,0.7915328025817872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,2,power_law_1.01,1.5694592475891114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,2,power_law_1.01,9.576032257080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,2,power_law_1.2,1.0977215766906738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,2,power_law_1.01,2.2458112716674803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,2,power_law_1.2,1.347315216064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,2,balanced,6.041760126749675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,2,power_law_1.01,2.84597110748291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,2,power_law_1.2,1.9635200500488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,2,power_law_1.01,3.9461185455322267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,2,power_law_1.2,2.475859260559082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,2,power_law_1.01,5.328646469116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,2,power_law_1.2,3.2116863250732424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,2,power_law_1.01,6.618412780761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,2,power_law_1.2,5.0665534973144535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,2,power_law_1.01,10.202310180664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,2,power_law_1.2,9.723661041259765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,2,power_law_1.01,20.97181396484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,2,balanced,9.559296290079752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,2,balanced,8.068538665771484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,2,balanced,8.189168294270834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,2,power_law_1.2,0.052108800411224364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,2,power_law_1.2,0.05753600001335144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,2,power_law_1.2,0.05692160129547119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,2,power_law_1.2,0.07157120108604431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,2,power_law_1.2,0.08921599984169007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,2,power_law_1.2,0.1062656044960022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,2,power_law_1.2,0.13829120397567748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,2,power_law_1.2,0.1465664029121399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,2,power_law_1.2,0.15196800231933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,2,power_law_1.2,0.1598080039024353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,2,power_law_1.2,0.17253119945526124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,2,power_law_1.2,0.17987200021743774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,2,power_law_1.2,0.18314239978790284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,2,power_law_1.2,0.2045056104660034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,2,balanced,18.967973073323567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,2,power_law_1.2,0.22188799381256102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,2,power_law_1.2,0.23441920280456544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,2,power_law_1.2,0.24828801155090333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,2,power_law_1.2,0.29974400997161865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,2,power_law_1.2,0.32836480140686036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,2,power_law_1.2,0.3968192100524902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,2,power_law_1.2,0.46730241775512693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,2,power_law_1.2,0.5871103763580322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,2,power_law_1.2,0.7310272216796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,2,power_law_1.2,1.0224255561828612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,2,power_law_1.2,1.2764991760253905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,2,power_law_1.2,1.8444992065429688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,2,power_law_1.2,2.428793525695801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,2,power_law_1.2,3.024569511413574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,2,power_law_1.2,4.770649719238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,2,power_law_1.2,10.120537567138673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,1,balanced,0.06400533517201741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,1,balanced,0.07789866626262665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,2,power_law_1.2,0.08144000172615051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,1,balanced,0.09152533610661824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,2,power_law_1.2,0.08814079761505127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,1,balanced,0.12380266189575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,2,power_law_1.2,0.09071360230445862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,1,balanced,0.18155733744303384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,1,balanced,0.28887466589609784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,2,power_law_1.2,0.10572160482406616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,1,balanced,0.057717333237330117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,1,balanced,0.292138675848643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,2,power_law_1.2,0.12168320417404174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,1,balanced,0.29366934299468994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,1,balanced,0.0629066675901413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,2,power_law_1.2,0.1387519955635071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,1,balanced,0.07587199906508128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,1,balanced,0.2967466711997986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,2,power_law_1.2,0.17624959945678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,1,balanced,0.10961066683133443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,1,balanced,0.2991093397140503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,1,balanced,0.15850133697191873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,2,power_law_1.2,0.18654719591140748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,1,balanced,0.3028053243954976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,1,balanced,0.25830399990081787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,2,power_law_1.2,0.1941375970840454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,1,balanced,0.3094080090522766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,1,balanced,0.259935994942983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,2,power_law_1.2,0.20613760948181153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,1,balanced,0.31457600990931195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,1,balanced,0.2635200023651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,1,balanced,0.266213337580363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,1,balanced,0.320357342561086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,2,power_law_1.2,0.2154304027557373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,1,balanced,0.2688000003496806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,1,balanced,0.3321760098139445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,2,power_law_1.2,0.23745920658111572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,1,balanced,0.27243200937906903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,1,balanced,0.3381706476211548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,2,power_law_1.2,0.24690558910369872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,1,balanced,0.27960532903671265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,2,power_law_1.2,0.27216639518737795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,1,balanced,0.3532533248265584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,1,balanced,0.28405332565307617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,2,power_law_1.2,0.3034559965133667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,1,balanced,0.2908533414204915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,1,balanced,0.4110026756922404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,2,power_law_1.2,0.3300607919692993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,1,balanced,0.3011573354403178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,1,balanced,0.4812213182449341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,1,power_law_1.01,0.05960959792137146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,2,power_law_1.2,0.3994431972503662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,1,power_law_1.01,0.05324159860610962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,1,balanced,0.3153173327445984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,1,power_law_1.01,0.07445120215415954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,1,balanced,0.5730239947636923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,1,power_law_1.01,0.0634112000465393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,1,balanced,0.3368159929911296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,1,power_law_1.01,0.07710080146789551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,1,power_law_1.01,0.06650239825248719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,2,power_law_1.2,0.49030399322509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,1,balanced,0.4007680018742879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,1,balanced,0.6308053334554037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,1,power_law_1.01,0.10743039846420288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,1,power_law_1.01,0.09356160163879394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,1,balanced,0.4658133188883464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,1,power_law_1.01,0.1376703977584839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,1,power_law_1.01,0.11894400119781494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,2,power_law_1.2,0.5473087787628174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,1,balanced,0.8490613301595052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,1,power_law_1.01,0.14617600440979003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,1,power_law_1.01,0.16462719440460205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,1,balanced,0.5359146595001221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,2,power_law_1.2,0.7298175811767578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,1,power_law_1.01,0.19909119606018066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,1,power_law_1.01,0.21877760887145997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,2,power_law_1.2,0.8793791770935059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,1,power_law_1.01,0.20347518920898439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,1,balanced,0.609941323598226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,1,balanced,1.102842648824056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,1,power_law_1.01,0.23123838901519775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,2,power_law_1.2,1.2985216140747071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,1,power_law_1.01,0.21665279865264891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,1,power_law_1.01,0.2420032024383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,1,power_law_1.01,0.22380800247192384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,1,balanced,0.8071413040161133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,2,power_law_1.2,1.576249599456787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,1,power_law_1.01,0.25068800449371337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,1,power_law_1.01,0.23566079139709473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,1,balanced,1.5842933654785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,2,power_law_1.2,2.1844608306884767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,1,power_law_1.01,0.25975680351257324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,1,power_law_1.01,0.24951679706573487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,1,balanced,1.0492160320281982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,1,power_law_1.01,0.27479679584503175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,2,power_law_1.2,2.918911933898926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,1,power_law_1.01,0.26462719440460203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,1,power_law_1.01,0.2799232006072998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,1,power_law_1.01,0.29092481136322024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,2,power_law_1.2,4.315820693969727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,1,power_law_1.01,0.2968575954437256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,1,power_law_1.01,0.31994879245758057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,1,balanced,2.005930741628011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,1,balanced,1.52892271677653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,1,power_law_1.01,0.3141952037811279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,2,power_law_1.2,5.439756774902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,1,power_law_1.01,0.3441215991973877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,1,power_law_1.01,0.3240384101867676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,1,power_law_1.01,0.3562623977661133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,2,power_law_1.2,7.507955169677734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,1,power_law_1.01,0.36903679370880127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,1,power_law_1.01,0.4347008228302002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,1,power_law_1.01,0.47832322120666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,1,power_law_1.01,0.46592001914978026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,2,power_law_1.2,11.127763366699218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,1,balanced,1.990821361541748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,1,power_law_1.01,0.5724671840667724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,1,power_law_1.01,0.5213119983673096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,1,balanced,2.950810750325521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,1,power_law_1.01,0.6860223770141601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,1,power_law_1.01,0.6720384120941162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,1,power_law_1.01,0.8705535888671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,2,power_law_1.2,23.9723388671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,1,power_law_1.01,0.7555776119232178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,1,power_law_1.01,1.094540786743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,1,power_law_1.01,0.9680512428283692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,1,power_law_1.01,1.4832768440246582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,1,power_law_1.01,1.1314240455627442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,1,balanced,2.9454132715861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,1,power_law_1.01,1.945088005065918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,1,power_law_1.01,1.5561344146728515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,1,power_law_1.01,2.816249656677246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,1,power_law_1.01,1.995270347595215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,1,balanced,3.6155519485473633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,1,power_law_1.01,3.6301952362060548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,1,power_law_1.01,2.861510467529297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,1,power_law_1.01,4.473625564575196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,1,power_law_1.01,3.6930240631103515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,1,power_law_1.01,4.5358528137207035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,1,power_law_1.01,7.049132537841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,1,balanced,3.6153173446655273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,1,power_law_1.01,6.815885162353515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,1,power_law_1.01,13.678509521484376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,1,power_law_1.01,13.183258056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,1,balanced,4.801221211751302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,1,power_law_1.2,0.06007680296897888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,1,power_law_1.2,0.0747327983379364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,1,balanced,4.810672124226888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,1,power_law_1.2,0.07742720246315002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,1,power_law_1.2,0.10429439544677735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,1,power_law_1.2,0.13267199993133544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,1,power_law_1.2,0.15675519704818724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,1,power_law_1.2,0.2093951940536499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,1,power_law_1.2,0.22834560871124268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,1,power_law_1.2,0.23372159004211426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,1,balanced,6.689333597819011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,1,power_law_1.2,0.24452478885650636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,1,power_law_1.2,0.2648256063461304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,1,power_law_1.2,0.2719871997833252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,1,power_law_1.2,0.28568320274353026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,1,power_law_1.2,0.30548479557037356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,1,balanced,7.113168080647786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,1,power_law_1.2,0.32799999713897704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,1,power_law_1.2,0.37392001152038573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,1,power_law_1.2,0.3811392068862915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,1,power_law_1.2,0.4922944068908691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,1,power_law_1.2,0.5727615833282471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,1,power_law_1.2,0.7032127857208252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,1,power_law_1.2,0.7631167888641357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,1,power_law_1.2,0.9564096450805664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,1,power_law_1.2,1.1914624214172362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,1,power_law_1.2,1.6266559600830077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,1,power_law_1.2,2.0203264236450194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,1,power_law_1.2,2.920889663696289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,1,power_law_1.2,3.7256641387939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,1,power_law_1.2,4.592448043823242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,1,power_law_1.2,6.7721916198730465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,1,power_law_1.2,13.136813354492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,1,balanced,13.162452697753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,1,balanced,13.667867024739584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,1,power_law_1.2,0.05300480127334595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,1,power_law_1.2,0.06238719820976257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,1,power_law_1.2,0.06947839856147767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,1,power_law_1.2,0.09068160057067871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,1,power_law_1.2,0.1120576024055481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,1,power_law_1.2,0.13663359880447387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,1,power_law_1.2,0.19340159893035888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,1,power_law_1.2,0.20368640422821044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,1,power_law_1.2,0.21549439430236816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,1,power_law_1.2,0.221068811416626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,1,power_law_1.2,0.24174718856811522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,1,power_law_1.2,0.2518719911575317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,1,power_law_1.2,0.2655168056488037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,1,power_law_1.2,0.30058879852294923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,1,power_law_1.2,0.32257919311523436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,1,power_law_1.2,0.35196800231933595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,1,power_law_1.2,0.3685120105743408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,1,power_law_1.2,0.44428157806396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,1,power_law_1.2,0.4983359813690186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,1,power_law_1.2,0.5896128177642822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,32,balanced,0.024319998919963837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,1,power_law_1.2,0.7025087833404541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,32,balanced,0.024666666984558105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,1,power_law_1.2,0.882579231262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,32,balanced,0.02446399877468745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,1,power_law_1.2,1.1202112197875977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,32,balanced,0.026330667237440746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,32,balanced,0.02865600089232127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,1,power_law_1.2,1.5443967819213866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,32,balanced,0.030080000559488933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,32,balanced,0.03378133227427801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,1,power_law_1.2,1.9710079193115235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,32,balanced,0.03365333378314972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,32,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,1,power_law_1.2,2.8467584609985352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,32,balanced,0.03467733412981033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,1,power_law_1.2,3.6527359008789064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,32,balanced,0.03009066730737686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,32,balanced,0.031888000667095184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,32,balanced,0.03219199925661087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,1,power_law_1.2,4.508768081665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,32,balanced,0.03602133442958196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,32,balanced,0.03203733265399933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,32,balanced,0.03885333240032196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,32,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,32,balanced,0.038922667503356934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,1,power_law_1.2,7.6688385009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,32,balanced,0.03196800003449122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,32,balanced,0.04031466692686081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,32,balanced,0.033930666744709015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,32,balanced,0.045365333557128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,1,power_law_1.2,13.694419860839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,32,balanced,0.04660266637802124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,32,balanced,0.03498133271932602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,32,balanced,0.047509332497914634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,32,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,32,balanced,0.023269332945346832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,32,balanced,0.035173334181308746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,32,balanced,0.05161066850026449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,32,balanced,0.03495466709136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,32,balanced,0.02362666775782903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,32,balanced,0.05287466446558634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,32,balanced,0.0359946663180987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,32,balanced,0.023557332654794056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,32,balanced,0.036101333796978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,32,balanced,0.025274666647116344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,32,balanced,0.06251733501752217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,32,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,32,balanced,0.0365280012289683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,32,balanced,0.028949332733949024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,32,balanced,0.03693866729736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,32,balanced,0.06579733391602834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,32,balanced,0.02914133419593175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,32,balanced,0.03818133225043615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,32,balanced,0.02870933214823405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,32,balanced,0.040634666879971824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,32,balanced,0.08267199993133545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,32,balanced,0.028965334097544353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,32,balanced,0.03982399900754293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,32,balanced,0.029317334294319153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,32,balanced,0.04078399886687597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,32,balanced,0.02978666623433431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,32,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,32,balanced,0.04502399762471517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,32,balanced,0.08902933200200398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,32,balanced,0.030400000512599945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,32,balanced,0.04436799883842468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,32,balanced,0.031152000029881794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,32,balanced,0.03421866645415624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,32,balanced,0.05189333359400431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,32,balanced,0.0334346666932106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,32,balanced,0.054917335510253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,32,balanced,0.12820800145467123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,32,balanced,0.07105599840482076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,32,balanced,0.03489066660404205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,32,balanced,0.0377813329299291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,32,balanced,0.08028266827265422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,32,balanced,0.038560000558694206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,32,balanced,0.1474240024884542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,32,balanced,0.10427199800809224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,32,balanced,0.045082668463389076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,32,power_law_1.01,0.025593599677085875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,32,power_law_1.01,0.0253248006105423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,32,balanced,0.04832000037034353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,32,balanced,0.11919466654459636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,32,power_law_1.01,0.026105600595474242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,32,power_law_1.01,0.026956799626350402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,32,power_law_1.01,0.02757120132446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,32,power_law_1.01,0.027846398949623107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,32,balanced,0.16616533199946085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,32,power_law_1.01,0.02821120023727417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,32,balanced,0.06391466657320659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,32,power_law_1.01,0.029190400242805482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,32,balanced,0.16595199704170227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,32,power_law_1.01,0.03310079872608185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,32,power_law_1.01,0.03680639863014221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,32,balanced,0.07162133355935414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,32,power_law_1.01,0.033990401029586795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,32,power_law_1.01,0.034841600060462954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,32,power_law_1.01,0.032576000690460204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,32,power_law_1.01,0.03797760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,32,power_law_1.01,0.03188480138778686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,32,power_law_1.01,0.024607999622821806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,32,power_law_1.01,0.03779839873313904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,32,power_law_1.01,0.032128000259399415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,32,power_law_1.01,0.023680000007152556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,32,power_law_1.01,0.04364160001277924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,32,power_law_1.01,0.032287999987602234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,32,balanced,0.20167466004689535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,32,power_law_1.01,0.023104000091552734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,32,power_law_1.01,0.034272000193595886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,32,power_law_1.01,0.04932479858398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,32,power_law_1.01,0.025760000944137572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,32,power_law_1.01,0.034169599413871765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,32,power_law_1.01,0.05185920000076294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,32,power_law_1.01,0.02625280022621155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,32,power_law_1.01,0.034585601091384886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,32,power_law_1.01,0.05006719827651977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,32,balanced,0.09467732906341553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,32,power_law_1.01,0.027385601401329042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,32,power_law_1.01,0.03516159951686859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,32,power_law_1.01,0.05512319803237915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,32,balanced,0.23783467213312784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,32,power_law_1.01,0.027551999688148497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,32,power_law_1.01,0.03555200099945068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,32,power_law_1.01,0.0667136013507843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,32,power_law_1.01,0.02800000011920929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,32,power_law_1.01,0.036550399661064145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,32,power_law_1.01,0.08028159737586975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,32,power_law_1.01,0.028115200996398925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,32,balanced,0.11374933520952861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,32,power_law_1.01,0.037036800384521486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,32,power_law_1.01,0.08145920038223267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,32,power_law_1.01,0.028204798698425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,32,power_law_1.01,0.029868799448013305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,32,power_law_1.01,0.03946239948272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,32,power_law_1.01,0.10138239860534667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,32,balanced,0.2359093427658081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,32,power_law_1.01,0.030700799822807313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,32,power_law_1.01,0.039654400944709775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,32,power_law_1.01,0.11509759426116943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,32,power_law_1.01,0.03312000036239624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,32,power_law_1.01,0.044172799587249754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,32,power_law_1.01,0.16664960384368896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,32,power_law_1.01,0.0379967987537384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,32,power_law_1.01,0.04503679871559143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,32,power_law_1.01,0.2012928009033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,32,power_law_1.01,0.041145598888397215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,32,balanced,0.15836800138155618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,32,power_law_1.01,0.0521664023399353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,32,power_law_1.01,0.04328320026397705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,32,power_law_1.01,0.2504256010055542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,32,power_law_1.01,0.05983999967575073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,32,power_law_1.01,0.3148672103881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,32,power_law_1.01,0.06002560257911682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,32,power_law_1.01,0.04410240054130554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,32,power_law_1.01,0.41636481285095217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,32,power_law_1.01,0.07173759937286377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,32,power_law_1.01,0.05942400097846985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,32,power_law_1.01,0.08006399869918823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,32,power_law_1.01,0.5977280139923096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,32,power_law_1.01,0.06888960003852844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,32,power_law_1.01,0.10672639608383179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,32,power_law_1.01,1.4567808151245116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,32,power_law_1.01,0.12072319984436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,32,balanced,0.1990613341331482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,32,power_law_1.01,0.15467519760131837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,32,power_law_1.01,0.07504640221595764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,32,power_law_1.01,0.2297600030899048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,32,power_law_1.01,0.09259520173072815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,32,balanced,0.35313065846761066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,32,power_law_1.01,0.30013439655303953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,32,power_law_1.01,0.12099839448928833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,32,power_law_1.01,0.3605184078216553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,32,power_law_1.01,0.14257919788360596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,32,power_law_1.01,0.495084810256958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,32,power_law_1.01,0.7621503829956054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,32,power_law_1.01,0.2537600040435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,32,power_law_1.01,1.569536018371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,32,power_law_1.01,0.2735680103302002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,32,balanced,0.4385066827138265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,32,power_law_1.2,0.026572799682617186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,32,power_law_1.2,0.03621760010719299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,32,power_law_1.01,0.38005120754241944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,32,power_law_1.2,0.026688000559806822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,32,power_law_1.2,0.03184640109539032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,32,power_law_1.01,0.6594240188598632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,32,balanced,0.2456586758295695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,32,power_law_1.2,0.026054400205612182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,32,power_law_1.2,0.0318336009979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,32,power_law_1.2,0.028972798585891725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,32,power_law_1.2,0.03196159899234772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,32,power_law_1.01,0.6639999866485595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,32,power_law_1.2,0.029177600145339967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,32,power_law_1.2,0.032416000962257385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,32,power_law_1.2,0.02927359938621521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,32,power_law_1.01,1.161843204498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,32,power_law_1.2,0.034092798829078674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,32,power_law_1.2,0.03374080061912536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,32,power_law_1.2,0.03454720079898834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,32,power_law_1.01,2.4136192321777346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,32,power_law_1.2,0.03521279990673065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,32,power_law_1.2,0.03514240086078644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,32,power_law_1.2,0.035155200958251955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,32,power_law_1.2,0.033580800890922545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,32,power_law_1.2,0.03550080060958862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,32,power_law_1.2,0.035750401020050046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,32,power_law_1.2,0.03654400110244751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,32,power_law_1.2,0.03687680065631867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,32,power_law_1.2,0.03866240084171295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,32,power_law_1.2,0.03827199935913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,32,power_law_1.2,0.042656001448631284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,32,power_law_1.2,0.042316800355911253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,32,power_law_1.2,0.04080640077590943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,32,balanced,0.3951946496963501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,32,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,32,power_law_1.2,0.047577598690986635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,32,power_law_1.2,0.050374400615692136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,32,power_law_1.2,0.05141760110855102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,32,power_law_1.2,0.05489280223846436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,32,balanced,0.6720693111419678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,32,power_law_1.2,0.05051519870758057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,32,power_law_1.2,0.05330560207366943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,32,power_law_1.2,0.0664896011352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,32,power_law_1.2,0.06392319798469544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,32,power_law_1.2,0.06837760210037232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,32,power_law_1.2,0.06764159798622131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,32,power_law_1.2,0.08580480217933655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,32,power_law_1.2,0.08359040021896362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,32,power_law_1.2,0.0893567979335785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,32,power_law_1.2,0.09882879853248597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,32,power_law_1.2,0.121561598777771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,32,power_law_1.2,0.1223296046257019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,32,power_law_1.2,0.13745280504226684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,32,power_law_1.2,0.13896960020065308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,32,power_law_1.2,0.2434688091278076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,32,power_law_1.2,0.22155520915985108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,32,power_law_1.2,0.28488960266113283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,32,power_law_1.2,0.272326397895813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,32,power_law_1.2,0.39304959774017334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,32,power_law_1.2,0.35364480018615724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,32,power_law_1.2,0.49541759490966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,32,power_law_1.2,0.5379583835601807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,32,power_law_1.2,0.8033984184265137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,32,power_law_1.2,0.7078271865844726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,32,power_law_1.2,1.2514240264892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,32,power_law_1.2,1.255737590789795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,32,power_law_1.2,3.3727294921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,32,power_law_1.2,2.9373184204101563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,32,balanced,0.7810133298238119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,32,power_law_1.2,0.025491198897361754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,32,power_law_1.2,0.02327679991722107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,32,power_law_1.2,0.0234047994017601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,16,balanced,0.022661333282788593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,32,power_law_1.2,0.026579201221466064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,16,balanced,0.0229120006163915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,32,power_law_1.2,0.027270400524139406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,16,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,16,balanced,0.02314666658639908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,16,balanced,0.02497066557407379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,32,power_law_1.2,0.028492799401283263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,16,balanced,0.029658667743206024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,16,balanced,0.027589333554108936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,32,power_law_1.2,0.028569599986076354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,16,balanced,0.0281333327293396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,16,balanced,0.030453334252039593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,16,balanced,0.029301332930723827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,32,power_law_1.2,0.02892799973487854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,16,balanced,0.032144000132878624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,16,balanced,0.02917333443959554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,32,power_law_1.2,0.028960001468658448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,16,balanced,0.027952000498771667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,16,balanced,0.03443733354409536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,16,balanced,0.03130666663249334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,32,power_law_1.2,0.02917119860649109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,16,balanced,0.03310399999221166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,16,balanced,0.03543466577927271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,16,balanced,0.033946665624777474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,32,power_law_1.2,0.030393600463867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,16,balanced,0.03532266616821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,16,balanced,0.03431999931732813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,32,power_law_1.2,0.03158400058746338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,16,balanced,0.035402665535608925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,16,balanced,0.033733333150545754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,32,power_law_1.2,0.03356159925460815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,16,balanced,0.03885866701602936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,16,balanced,0.03526933242877325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,16,balanced,0.042730664213498436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,16,balanced,0.035616000493367515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,32,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,16,balanced,0.04030933231115341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,16,balanced,0.03621333340803782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,32,power_law_1.2,0.0440447986125946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,16,balanced,0.050794666012128196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,16,balanced,0.023770667612552643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,16,balanced,0.03590933233499527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,32,power_law_1.2,0.04525440037250519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,16,balanced,0.04629333317279816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,16,balanced,0.036933332681655884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,16,balanced,0.02387733260790507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,16,balanced,0.05630399783452352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,16,balanced,0.02438933402299881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,16,balanced,0.03843733419974645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,32,power_law_1.2,0.051123201847076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,16,balanced,0.02621866762638092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,16,balanced,0.056277334690093994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,16,balanced,0.04062933226426443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,32,power_law_1.2,0.061919999122619626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,16,balanced,0.027610667049884796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,16,balanced,0.039877332746982574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,32,power_law_1.2,0.07539839744567871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,16,balanced,0.02871999889612198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,16,balanced,0.06746666630109151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,16,balanced,0.04085866610209147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,16,balanced,0.028837333122889202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,16,balanced,0.02898666759332021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,16,balanced,0.04696000119050344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,16,balanced,0.07131200035413106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,16,balanced,0.02884799987077713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,32,power_law_1.2,0.10087039470672607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,16,balanced,0.02958933264017105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,16,balanced,0.04650133351484934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,32,power_law_1.2,0.11534080505371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,16,power_law_1.01,0.027718400955200194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,16,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,16,balanced,0.030623999734719593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,16,balanced,0.09381866455078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,16,balanced,0.05494399865468343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,32,power_law_1.2,0.14547200202941896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,16,balanced,0.03139200061559677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,16,power_law_1.01,0.024435199797153473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,16,balanced,0.031632001201311745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,32,power_law_1.2,0.18691200017929077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,16,power_law_1.01,0.024607999622821806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,16,balanced,0.06097066899140676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,16,power_law_1.01,0.026387199759483337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,16,power_law_1.01,0.029977598786354066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,16,balanced,0.03629333277543386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,16,balanced,0.10099732875823975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,16,power_law_1.01,0.029120001196861266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,16,balanced,0.07730666796366374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,32,power_law_1.2,0.30653440952301025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,16,power_law_1.01,0.03054080009460449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,16,balanced,0.037471999724706016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,32,power_law_1.2,0.5026495933532715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,16,power_law_1.01,0.03054080009460449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,16,power_law_1.01,0.031763198971748355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,32,power_law_1.2,0.6909567832946777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,16,balanced,0.08591467142105103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,16,power_law_1.01,0.03500800132751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,32,power_law_1.2,0.909823989868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,16,power_law_1.01,0.04071039855480194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,16,power_law_1.01,0.04074240028858185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,16,balanced,0.03745066622893015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,16,power_law_1.01,0.042368000745773314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,16,balanced,0.14814399679501852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,32,power_law_1.2,1.1454848289489745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,16,balanced,0.11649066209793091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,16,power_law_1.01,0.04302720129489899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,16,balanced,0.04141333450873693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,16,power_law_1.01,0.04627839922904968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,32,power_law_1.2,2.188620758056641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,16,power_law_1.01,0.04917759895324707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,16,power_law_1.01,0.038412800431251524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,16,balanced,0.04318400224049886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,16,power_law_1.01,0.05615360140800476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,32,power_law_1.2,4.9353984832763675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,16,power_law_1.01,0.06652160286903382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,16,power_law_1.01,0.03247359991073608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,16,power_law_1.01,0.06392319798469544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,16,power_law_1.01,0.0302592009305954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,16,balanced,0.13407466808954874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,16,power_law_1.01,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,16,power_law_1.01,0.03219839930534363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,16,power_law_1.01,0.08161280155181885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,16,balanced,0.0525493323802948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,16,power_law_1.01,0.09249920248985291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,16,power_law_1.01,0.03258239924907684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,16,balanced,0.17497066656748453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,16,power_law_1.01,0.11431679725646973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,16,balanced,0.05916266640027364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,16,power_law_1.01,0.033817601203918454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,16,power_law_1.01,0.14631680250167847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,16,power_law_1.01,0.03447040021419525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,16,power_law_1.01,0.17424000501632692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,16,power_law_1.01,0.26319360733032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,16,power_law_1.01,0.03495039939880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,16,power_law_1.2,0.02653439939022064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,16,balanced,0.18999467293421426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,16,power_law_1.01,0.3241280078887939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,16,power_law_1.01,0.03598720133304596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,16,power_law_1.01,0.395417594909668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,16,power_law_1.2,0.022700800001621245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,16,power_law_1.01,0.03616639971733093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,16,power_law_1.01,0.6309120178222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,16,power_law_1.2,0.024198399484157564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,16,balanced,0.07892799874146779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,16,power_law_1.01,0.027084800601005554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,16,power_law_1.01,0.03731839954853058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,16,power_law_1.01,1.1449664115905762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,16,power_law_1.2,0.024358400702476503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,16,power_law_1.01,0.024512000381946564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,16,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,16,power_law_1.2,0.02720000147819519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,16,balanced,0.20267732938130698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,16,balanced,0.0897653301556905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,16,power_law_1.01,0.024358400702476503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,16,power_law_1.01,0.039315199851989745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,16,power_law_1.2,0.028870400786399842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,16,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,16,power_law_1.01,0.04199039936065674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,16,power_law_1.2,0.02901119887828827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,16,balanced,0.2367466688156128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,16,power_law_1.01,0.027475199103355406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,16,power_law_1.01,0.04567680060863495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,16,power_law_1.2,0.03127039968967438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,16,power_law_1.01,0.02895359992980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,16,power_law_1.01,0.04676479995250702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,16,power_law_1.2,0.032793599367141726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,16,power_law_1.01,0.050367999076843264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,16,power_law_1.01,0.029017600417137145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,16,power_law_1.2,0.03436160087585449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,16,balanced,0.12211733063062032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,16,power_law_1.01,0.05971199870109558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,16,power_law_1.2,0.03986560106277466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,16,power_law_1.01,0.029548799991607665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,16,power_law_1.2,0.040678399801254275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,16,power_law_1.01,0.05998079776763916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,16,power_law_1.01,0.030380800366401672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,16,power_law_1.2,0.042656001448631284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,16,power_law_1.01,0.07330560088157653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,16,power_law_1.01,0.03118079900741577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,16,power_law_1.01,0.08387839794158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,16,power_law_1.2,0.04327679872512817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,16,power_law_1.01,0.0328575998544693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,16,balanced,0.14924266934394836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,16,power_law_1.01,0.10604159832000733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,16,power_law_1.2,0.04780159890651703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,16,power_law_1.01,0.03409920036792755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,16,balanced,0.2794933319091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,16,power_law_1.01,0.12645119428634644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,16,power_law_1.2,0.04962559938430786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,16,power_law_1.01,0.035571199655532834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,16,balanced,0.30535467465718585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,16,power_law_1.01,0.17063679695129394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,16,power_law_1.2,0.05761920213699341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,16,power_law_1.01,0.03861120045185089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,16,power_law_1.01,0.23508479595184326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,16,power_law_1.2,0.06986240148544312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,16,power_law_1.01,0.041503998637199405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,16,power_law_1.01,0.28628480434417725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,16,power_law_1.2,0.06458879709243774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,16,balanced,0.21663999557495117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,16,power_law_1.01,0.045049598813056944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,16,power_law_1.01,0.4248511791229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,16,power_law_1.2,0.08683519959449768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,16,power_law_1.01,0.49465599060058596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,16,power_law_1.2,0.09291520118713378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,16,power_law_1.2,0.12164479494094849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,16,power_law_1.01,0.7398911952972412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,16,power_law_1.01,0.04907520115375519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,16,power_law_1.2,0.13996800184249877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,16,power_law_1.01,0.05735039710998535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,16,power_law_1.01,1.4913984298706056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,16,power_law_1.01,0.06726400256156921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,16,power_law_1.2,0.17489919662475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,16,balanced,0.29237866401672363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,16,power_law_1.2,0.25236480236053466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,16,power_law_1.01,0.07686399817466735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,16,power_law_1.2,0.3116735935211182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,16,power_law_1.01,0.09379839897155762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,16,balanced,0.43562134106953937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,16,power_law_1.2,0.4565120220184326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,16,power_law_1.2,0.5932864189147949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,16,power_law_1.01,0.12088320255279542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,16,power_law_1.2,0.9095487594604492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,16,power_law_1.01,0.15493119955062867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,16,power_law_1.2,2.1295167922973635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,16,power_law_1.01,0.23253118991851807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,16,balanced,0.36101865768432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,16,power_law_1.01,0.27799038887023925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,16,power_law_1.01,0.4764095783233643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,16,power_law_1.01,0.5395071983337403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,16,power_law_1.01,0.7022655963897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,16,balanced,0.5633546511332194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,16,power_law_1.01,1.2849535942077637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,16,power_law_1.01,2.185958480834961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,16,balanced,0.5568480094273885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,16,balanced,0.8420906861623129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,16,power_law_1.2,0.03727999925613403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,16,power_law_1.2,0.030432000756263733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,16,power_law_1.2,0.03272959887981415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,16,balanced,1.098581314086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,16,power_law_1.2,0.03189760148525238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,16,power_law_1.2,0.03242239952087402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,16,power_law_1.2,0.034720000624656674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,16,power_law_1.2,0.03450239896774292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,16,power_law_1.2,0.036211198568344115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,16,power_law_1.2,0.037088000774383546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,16,power_law_1.2,0.036697599291801455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,16,power_law_1.2,0.027084800601005554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,16,power_law_1.2,0.03751679956912994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,16,power_law_1.2,0.024268800020217897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,16,power_law_1.2,0.03790720105171204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,16,power_law_1.2,0.02444159984588623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,16,power_law_1.2,0.039724799990653994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,16,power_law_1.2,0.0263808012008667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,16,power_law_1.2,0.042316800355911253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,16,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,16,power_law_1.2,0.047116801142692566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,16,power_law_1.2,0.029075199365615846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,16,power_law_1.2,0.02908799946308136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,16,power_law_1.2,0.04782719910144806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,16,power_law_1.2,0.030527999997138976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,16,power_law_1.2,0.05110399723052979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,16,power_law_1.2,0.03160960078239441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,16,power_law_1.2,0.06305919885635376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,16,power_law_1.2,0.03284479975700379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,16,power_law_1.2,0.06584960222244263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,16,power_law_1.2,0.032691198587417605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,16,power_law_1.2,0.07950080037117005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,16,power_law_1.2,0.034329599142074584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,16,power_law_1.2,0.09149439930915833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,16,power_law_1.2,0.03596160113811493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,16,power_law_1.2,0.12703360319137574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,16,power_law_1.2,0.040652799606323245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,16,power_law_1.2,0.143231999874115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,16,power_law_1.2,0.20556800365447997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,16,power_law_1.2,0.04471679925918579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,16,power_law_1.2,0.2542464017868042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,16,power_law_1.2,0.04565120041370392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,16,power_law_1.2,0.3739903926849365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,8,balanced,0.022997332115968067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,16,power_law_1.2,0.6040256023406982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,16,power_law_1.2,0.048979198932647704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,8,balanced,0.022426667312781017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,16,power_law_1.2,0.6349887847900391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,8,balanced,0.022533332308133442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,16,power_law_1.2,0.06461439728736877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,8,balanced,0.025413334369659424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,16,power_law_1.2,1.4281599998474122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,16,power_law_1.2,0.07242879867553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,8,balanced,0.026687999566396076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,8,balanced,0.027845333019892376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,16,power_law_1.2,2.281318473815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,8,balanced,0.028064000109831493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,16,power_law_1.2,0.08344320058822632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,8,balanced,0.028058665494124096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,16,power_law_1.2,0.10668799877166749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,8,balanced,0.03047466774781545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,8,balanced,0.02773333340883255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,8,balanced,0.02899733434120814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,8,balanced,0.029898665845394135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,16,power_law_1.2,0.15030399560928345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,8,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,8,balanced,0.03121600051720937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,16,power_law_1.2,0.17711360454559327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,8,balanced,0.031445334355036415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,8,balanced,0.033701332906881966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,8,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,8,balanced,0.036757332583268486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,16,power_law_1.2,0.2825023889541626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,8,balanced,0.035242666800816856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,8,balanced,0.03718933214743932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,16,power_law_1.2,0.37793920040130613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,8,balanced,0.03998400022586187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,8,balanced,0.03755733370780945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,16,power_law_1.2,0.8124863624572753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,8,balanced,0.04312533140182495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,8,balanced,0.03742400060097376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,8,balanced,0.04292266567548116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,16,power_law_1.2,0.9546048164367675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,8,balanced,0.03749866783618927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,8,balanced,0.0543039987484614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,8,balanced,0.0377866675456365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,16,power_law_1.2,1.0634048461914063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,8,balanced,0.049839998284975685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,8,balanced,0.03805333375930786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,16,power_law_1.2,1.7730752944946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,8,balanced,0.03859733293453852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,8,balanced,0.06137600044409434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,8,balanced,0.025098666548728943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,8,balanced,0.03942933430274328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,16,power_law_1.2,4.744192123413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,8,balanced,0.06544533371925354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,8,balanced,0.02603200078010559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,8,balanced,0.03989866624275843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,8,power_law_1.01,0.025920000672340394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,8,balanced,0.026661333938439686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,8,balanced,0.04330133398373922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,8,balanced,0.028463999430338543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,8,balanced,0.07999466856320699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,8,power_law_1.01,0.023423999547958374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,8,balanced,0.04332800209522247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,8,power_law_1.01,0.022726400196552275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,8,balanced,0.032138665517171226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,8,power_law_1.01,0.027980801463127137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,8,balanced,0.044480000933011375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,8,balanced,0.03292266776164373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,8,power_law_1.01,0.026412799954414368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,8,balanced,0.0839359958966573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,8,balanced,0.033029332756996155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,8,balanced,0.051130667328834534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,8,power_law_1.01,0.02800000011920929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,8,balanced,0.03287466615438461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,8,power_law_1.01,0.030028799176216127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,8,power_law_1.01,0.034457600116729735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,8,balanced,0.05128533144791921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,8,balanced,0.03347733368476232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,8,power_law_1.01,0.029836800694465638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,8,power_law_1.01,0.032102400064468385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,8,power_law_1.01,0.030329599976539612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,8,balanced,0.03405333310365677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,8,balanced,0.11409599582354228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,8,balanced,0.06171200176080068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,8,power_law_1.01,0.0339711993932724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,8,power_law_1.01,0.030681601166725157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,8,balanced,0.034245334565639496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,8,power_law_1.01,0.03632639944553375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,8,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,8,balanced,0.07161599894364674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,8,balanced,0.03531199942032496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,8,power_law_1.01,0.037254399061203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,8,power_law_1.01,0.037567999958992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,8,power_law_1.01,0.03415679931640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,8,balanced,0.03583466758330663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,8,power_law_1.01,0.04537599980831146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,8,balanced,0.12983466188112894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,8,power_law_1.01,0.03603839874267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,8,balanced,0.0366293340921402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,8,balanced,0.09192533294359843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,8,power_law_1.01,0.05008000135421753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,8,power_law_1.01,0.036582401394844054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,8,power_law_1.01,0.05113599896430969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,8,power_law_1.01,0.03680639863014221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,8,power_law_1.01,0.058246397972106935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,8,balanced,0.042778665820757546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,8,power_law_1.01,0.037747201323509214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,8,power_law_1.01,0.06285439729690552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,8,balanced,0.10297066966692607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,8,power_law_1.01,0.03850879967212677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,8,power_law_1.01,0.0661184012889862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,8,balanced,0.04211199780305227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,8,power_law_1.01,0.03935360014438629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,8,power_law_1.01,0.07466880083084107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,8,power_law_1.01,0.08791679739952088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,8,power_law_1.01,0.04082559943199158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,8,balanced,0.19601066907246908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,8,power_law_1.01,0.11534719467163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,8,power_law_1.01,0.04392319917678833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,8,balanced,0.14241066575050354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,8,power_law_1.01,0.11121920347213746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,8,power_law_1.01,0.04203520119190216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,8,power_law_1.01,0.14622080326080322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,8,power_law_1.01,0.04565759897232056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,8,balanced,0.045040001471837364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,8,power_law_1.01,0.21318399906158447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,8,power_law_1.01,0.04842880070209503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,8,power_law_1.01,0.3187263965606689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,8,balanced,0.05268799761931101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,8,power_law_1.01,0.052985602617263795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,8,power_law_1.01,0.37405440807342527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,8,balanced,0.1729173262914022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,8,power_law_1.01,0.06249600052833557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,8,balanced,0.0545066644748052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,8,power_law_1.01,0.47150721549987795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,8,power_law_1.01,0.0658623993396759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,8,power_law_1.01,0.6629504203796387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,8,balanced,0.23444799582163492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,8,power_law_1.01,0.07881600260734559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,8,power_law_1.01,1.7251968383789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,8,power_law_1.01,0.09548159837722778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,8,balanced,0.07022933165232341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,8,power_law_1.01,0.11658240556716919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,8,balanced,0.252837340037028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,8,power_law_1.01,0.14665600061416625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,8,balanced,0.08052266637484233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,8,power_law_1.01,0.18784639835357667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,8,power_law_1.01,0.23255679607391358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,8,power_law_1.01,0.027910399436950683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,8,power_law_1.01,0.3697983980178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,8,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,8,power_law_1.01,0.4568511962890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,8,power_law_1.01,0.02650879919528961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,8,balanced,0.10752000411351521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,8,balanced,0.28933332363764447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,8,power_law_1.01,0.5754432201385498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,8,power_law_1.01,0.029254400730133058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,8,power_law_1.01,0.0304639995098114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,8,balanced,0.32180800040562946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,8,power_law_1.01,0.9055295944213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,8,balanced,0.12506666779518127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,8,power_law_1.01,0.03213439881801605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,8,power_law_1.01,1.947929573059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,8,power_law_1.01,0.031999999284744264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,8,power_law_1.01,0.03340800106525421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,8,power_law_1.01,0.034534400701522826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,8,power_law_1.01,0.03498240113258362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,8,power_law_1.01,0.036524799466133115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,8,balanced,0.18330132961273193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,8,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,8,balanced,0.39553598562876385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,8,power_law_1.01,0.03940480053424835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,8,power_law_1.01,0.042412799596786496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,8,balanced,0.24450665712356567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,8,balanced,0.4550880193710327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,8,power_law_1.01,0.04778240025043488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,8,power_law_1.01,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,8,power_law_1.01,0.055430400371551516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,8,balanced,0.353434681892395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,8,power_law_1.01,0.06704000234603882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,8,power_law_1.01,0.07537279725074768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,8,power_law_1.01,0.09354239702224731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,8,power_law_1.01,0.11975040435791015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,8,power_law_1.2,0.02563199996948242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,8,balanced,0.6334346532821655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,8,power_law_1.01,0.15029120445251465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,8,power_law_1.2,0.022444799542427063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,8,balanced,0.45949331919352215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,8,power_law_1.2,0.022720000147819518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,8,power_law_1.01,0.17933440208435059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,8,power_law_1.2,0.029254400730133058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,8,power_law_1.01,0.36972799301147463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,8,power_law_1.2,0.02728320062160492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,8,power_law_1.2,0.02908799946308136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,8,power_law_1.01,0.3428607940673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,8,power_law_1.2,0.029843199253082275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,8,power_law_1.01,0.5506048202514648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,8,power_law_1.2,0.03170560002326965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,8,power_law_1.01,0.7093952178955079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,8,power_law_1.2,0.032691198587417605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,8,power_law_1.01,0.9073087692260742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,8,power_law_1.2,0.03452799916267395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,8,power_law_1.2,0.03767040073871612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,8,balanced,0.5692586501439413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,8,power_law_1.01,1.5676544189453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,8,power_law_1.2,0.03749760091304779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,8,power_law_1.2,0.03857919871807099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,8,power_law_1.01,2.684947204589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,8,power_law_1.2,0.04635519981384277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,8,power_law_1.2,0.049395200610160825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,8,power_law_1.2,0.05255039930343628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,8,power_law_1.2,0.058316802978515624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,8,balanced,0.8526720205942789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,8,power_law_1.2,0.0671999990940094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,8,power_law_1.2,0.06952319741249084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,8,power_law_1.2,0.07857919931411743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,8,power_law_1.2,0.09144319891929627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,8,power_law_1.2,0.035283198952674864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,8,power_law_1.2,0.11179519891738891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,8,power_law_1.2,0.12634240388870238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,8,power_law_1.2,0.02951039969921112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,8,balanced,0.8878453572591146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,8,power_law_1.2,0.16762239933013917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,8,power_law_1.2,0.030713599920272828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,8,balanced,1.1966026624043782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,8,power_law_1.2,0.03310079872608185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,8,power_law_1.2,0.22560639381408693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,8,power_law_1.2,0.034355199337005614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,8,power_law_1.2,0.36608641147613524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,8,power_law_1.2,0.03620480000972748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,8,power_law_1.2,0.45352959632873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,8,power_law_1.2,0.03637759983539581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,8,power_law_1.2,0.5617728233337402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,8,power_law_1.2,0.03743360042572021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,8,power_law_1.2,1.0981951713562013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,8,power_law_1.2,0.038387200236320494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,8,power_law_1.2,0.03909119963645935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,8,power_law_1.2,1.9476095199584962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,8,power_law_1.2,0.039878401160240176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,8,power_law_1.2,0.041017600893974306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,8,power_law_1.2,0.044377601146698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,8,power_law_1.2,0.04237439930438995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,8,power_law_1.2,0.04648320078849792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,8,power_law_1.2,0.0495743989944458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,8,power_law_1.2,0.05605760216712952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,8,power_law_1.2,0.06490880250930786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,8,power_law_1.2,0.06949120163917541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,8,power_law_1.2,0.08435840010643006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,8,power_law_1.2,0.10566400289535523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,8,power_law_1.2,0.1293951988220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,8,power_law_1.2,0.16629120111465454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,8,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,8,power_law_1.2,0.2480384111404419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,8,balanced,1.7508373260498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,8,power_law_1.2,0.26201601028442384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,8,power_law_1.2,0.026163199543952943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,8,power_law_1.2,0.4419136047363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,8,power_law_1.2,0.026156800985336303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,8,power_law_1.2,0.02881920039653778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,8,power_law_1.2,0.6193600177764893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,8,power_law_1.2,0.029785600304603577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,8,power_law_1.2,0.7459775924682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,8,power_law_1.2,0.033011201024055484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,8,power_law_1.2,1.300166416168213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,8,power_law_1.2,0.03324800133705139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,8,power_law_1.2,0.03480960130691528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,32,balanced,0.0384853333234787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,8,power_law_1.2,3.2861248016357423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,8,power_law_1.2,0.03566080033779144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,32,balanced,0.03825599948565165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,32,balanced,0.03818133225043615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,8,power_law_1.2,0.03589119911193848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,32,balanced,0.04879466692606608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,32,balanced,0.06492800017197926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,32,balanced,0.06645333270231883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,8,power_law_1.2,0.03800959885120392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,32,balanced,0.06564799944559734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,8,power_law_1.2,0.040064001083374025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,32,balanced,0.06666133304437001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,8,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,32,balanced,0.06711466610431671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,32,balanced,0.06708799799283345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,8,power_law_1.2,0.045388799905776975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,32,balanced,0.06749333441257477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,32,balanced,0.06821866830190022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,32,balanced,0.0691786656777064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,8,power_law_1.2,0.050323200225830075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,32,balanced,0.07564799984296162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,8,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,32,balanced,0.07425066828727722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,32,balanced,0.08003733555475871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,32,balanced,0.08303466439247131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,32,balanced,0.08125866452852885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,8,power_law_1.2,0.05736960172653198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,32,balanced,0.08450667063395183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,8,power_law_1.2,0.06954240202903747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,32,balanced,0.08660266796747844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,8,power_law_1.2,0.08843520283699036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,32,balanced,0.09844266374905904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,8,power_law_1.2,0.10720640420913696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,32,balanced,0.11544000109036763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,8,power_law_1.2,0.12821760177612304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,8,power_law_1.2,0.17265280485153198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,32,balanced,0.11994133392969768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,8,power_law_1.2,0.23653120994567872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,32,balanced,0.18084800243377686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,8,power_law_1.2,0.3539007902145386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,8,power_law_1.2,0.4168255805969238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,8,power_law_1.2,0.700051212310791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,32,balanced,0.19139200448989868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,8,power_law_1.2,1.0257408142089843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,8,power_law_1.2,1.2795583724975585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,8,power_law_1.2,2.1326847076416016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,32,balanced,0.033439998825391136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,8,power_law_1.2,4.233324813842773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,32,balanced,0.26764265696207684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,32,balanced,0.03359466542800268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,32,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,32,balanced,0.03587199995915095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,32,balanced,0.05136000116666158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,32,balanced,0.05276800195376078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,32,balanced,0.05249066650867462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,32,balanced,0.05308799942334493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,32,balanced,0.30501333872477215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,32,balanced,0.05292266607284546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,32,balanced,0.054229333996772766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,32,balanced,0.055386667450269066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,32,balanced,0.055439998706181846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,32,balanced,0.05641066531340281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,32,balanced,0.0577706644932429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,32,power_law_1.01,0.060710400342941284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,32,balanced,0.028069332242012024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,32,balanced,0.06118399898211161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,32,power_law_1.01,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,32,balanced,0.02829866607983907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,32,balanced,0.06195733447869619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,32,balanced,0.3809066613515218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,32,power_law_1.01,0.04888960123062134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,32,balanced,0.02829866607983907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,32,balanced,0.06487466891606648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,32,power_law_1.01,0.05926399827003479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,32,balanced,0.03215466688076655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,32,power_law_1.01,0.05947520136833191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,32,balanced,0.06855999926726024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,32,balanced,0.046623999873797096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,32,power_law_1.01,0.06484479904174804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,32,balanced,0.04729066789150238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,32,balanced,0.07458133498827617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,32,power_law_1.01,0.04705919921398163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,32,power_law_1.01,0.06564480066299438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,32,balanced,0.047637333472569786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,32,power_law_1.01,0.0663424015045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,32,balanced,0.08577600121498108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,32,power_law_1.01,0.042956799268722534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,32,balanced,0.04762666424115499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,32,power_law_1.01,0.06694399714469909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,32,power_law_1.01,0.039852800965309146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,32,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,32,balanced,0.09367466966311137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,32,power_law_1.01,0.07048320174217224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,32,power_law_1.01,0.04309119880199432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,32,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,32,power_law_1.01,0.07074559926986694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,32,power_law_1.01,0.04633600115776062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,32,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,32,power_law_1.01,0.07725440263748169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,32,balanced,0.1129813293615977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,32,power_law_1.01,0.05234559774398804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,32,balanced,0.0499946673711141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,32,power_law_1.01,0.0788927972316742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,32,power_law_1.01,0.051520001888275144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,32,balanced,0.05076266825199127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,32,power_law_1.01,0.08227840065956116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,32,power_law_1.01,0.05270400047302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,32,balanced,0.051413332422574363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,32,balanced,0.12711466352144876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,32,balanced,0.5742719968159994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,32,power_law_1.01,0.08499199748039246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,32,power_law_1.01,0.056953597068786624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,32,power_law_1.01,0.0939520001411438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,32,power_law_1.01,0.05486720204353333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,32,power_law_1.01,0.05605760216712952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,32,power_law_1.01,0.101254403591156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,32,balanced,0.18285866578420004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,32,power_law_1.01,0.061401599645614625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,32,power_law_1.01,0.11250560283660889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,32,balanced,0.05606399973233541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,32,power_law_1.01,0.06445440053939819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,32,power_law_1.01,0.12368639707565307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,32,balanced,0.05630399783452352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,32,power_law_1.01,0.06445440053939819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,32,power_law_1.01,0.13835519552230835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,32,power_law_1.01,0.06917120218276977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,32,power_law_1.01,0.18046720027923585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,32,balanced,0.2100586692492167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,32,power_law_1.01,0.07822719812393189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,32,power_law_1.01,0.26184959411621095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,32,power_law_1.01,0.043654400110244754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,32,power_law_1.01,0.07715200185775757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,32,power_law_1.01,0.28406400680541993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,32,power_law_1.01,0.0917568027973175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,32,power_law_1.01,0.03509120047092438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,32,power_law_1.01,0.3897984027862549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,32,power_law_1.01,0.10308480262756348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,32,power_law_1.01,0.03369599878787995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,32,power_law_1.01,0.4756159782409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,32,power_law_1.2,0.06036480069160462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,32,power_law_1.01,0.13979519605636598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,32,power_law_1.01,0.036051198840141296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,32,power_law_1.01,0.6724480152130127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,32,power_law_1.01,0.14850560426712037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,32,balanced,0.05932799975077311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,32,power_law_1.2,0.0463808000087738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,32,power_law_1.01,0.04229120016098022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,32,balanced,0.30004266897837323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,32,power_law_1.01,0.9053695678710938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,32,power_law_1.01,0.20369279384613037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,32,power_law_1.2,0.048403200507164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,32,power_law_1.01,0.046623998880386354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,32,balanced,0.06491733094056447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,32,power_law_1.01,1.2977855682373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,32,power_law_1.01,0.23551359176635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,32,power_law_1.2,0.05751039981842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,32,power_law_1.01,0.04764159917831421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,32,power_law_1.01,2.023699188232422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,32,balanced,0.0673226664463679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,32,power_law_1.01,0.32127358913421633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,32,power_law_1.01,0.04819200038909912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,32,power_law_1.2,0.05533440113067627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,32,power_law_1.01,0.4293504238128662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,32,power_law_1.01,3.6620929718017576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,32,power_law_1.01,0.05114240050315857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,32,power_law_1.2,0.0652288019657135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,32,power_law_1.01,0.6408448219299316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,32,power_law_1.2,0.06313599944114685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,32,power_law_1.01,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,32,power_law_1.01,0.9283647537231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,32,balanced,0.07726400097211202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,32,power_law_1.2,0.06818559765815735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,32,power_law_1.01,0.057183998823165896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,32,balanced,0.36584532260894775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,32,power_law_1.01,0.8319680213928222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,32,power_law_1.2,0.06794880032539367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,32,power_law_1.01,0.057920002937316896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,32,balanced,0.08386666576067607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,32,power_law_1.2,0.07151359915733338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,32,power_law_1.01,0.06096640229225159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,32,power_law_1.01,1.3932671546936035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,32,power_law_1.2,0.07303040027618408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,32,power_law_1.01,0.06796159744262695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,32,balanced,1.096880038579305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,32,balanced,0.1104159951210022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,32,power_law_1.01,3.446041488647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,32,power_law_1.2,0.22016639709472657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,32,power_law_1.2,0.3617856025695801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,32,power_law_1.01,0.07374079823493958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,32,balanced,0.12359999616940816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,32,power_law_1.2,0.08508800268173218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,32,power_law_1.01,0.07824000120162963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,32,power_law_1.2,0.09422720074653626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,32,power_law_1.2,0.1076159954071045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,32,balanced,0.45022400220235187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,32,balanced,0.16870399316151938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,32,power_law_1.2,0.10618879795074462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,32,power_law_1.01,0.07592319846153259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,32,power_law_1.2,0.13054720163345337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,32,power_law_1.01,0.09884799718856811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,32,power_law_1.2,0.14362239837646484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,32,power_law_1.01,0.11346559524536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,32,power_law_1.2,0.17481600046157836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,32,balanced,0.20961600542068481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,32,power_law_1.01,0.14205440282821655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,32,power_law_1.2,0.22355198860168457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,32,power_law_1.01,0.15831040143966674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,32,power_law_1.2,0.3529344081878662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,32,power_law_1.01,0.2145792007446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,32,power_law_1.2,0.3380863904953003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,32,power_law_1.01,0.31675519943237307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,32,power_law_1.2,0.4955776214599609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,32,power_law_1.01,0.48046078681945803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,32,power_law_1.2,0.7932096004486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,32,power_law_1.01,0.56462721824646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,32,power_law_1.2,1.3473471641540526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,32,power_law_1.2,1.2226176261901855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,32,balanced,0.3170986572901408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,32,balanced,0.6837973594665527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,32,power_law_1.2,1.9233280181884767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,32,power_law_1.01,0.8902463912963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,32,power_law_1.01,1.1501824378967285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,32,power_law_1.2,3.1318336486816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,32,power_law_1.01,1.3980352401733398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,32,power_law_1.2,6.663980865478516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,32,power_law_1.01,2.775494384765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,32,power_law_1.2,0.047091200947761536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,32,power_law_1.01,4.915500640869141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,32,power_law_1.2,0.035699200630187986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,32,balanced,0.4139893452326457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,32,power_law_1.2,0.040608000755310056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,32,power_law_1.2,0.043219199776649474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,32,power_law_1.2,0.04280959963798523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,32,power_law_1.2,0.05245440006256104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,32,power_law_1.2,0.052288001775741576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,32,power_law_1.2,0.05317760109901428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,32,power_law_1.2,0.05484799742698669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,32,balanced,0.5245920022328695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,32,power_law_1.2,0.056550401449203494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,32,power_law_1.2,0.06113920211791992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,32,power_law_1.2,0.06416000127792358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,32,power_law_1.2,0.06481919884681701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,32,power_law_1.2,0.06724479794502258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,32,power_law_1.2,0.07203199863433837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,32,power_law_1.2,0.07845759987831116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,32,power_law_1.2,0.07754240036010743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,32,power_law_1.2,0.0981440007686615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,32,balanced,1.3199146588643391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,32,power_law_1.2,0.11735680103302001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,32,power_law_1.2,0.1601088047027588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,32,power_law_1.2,0.1699455976486206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,32,balanced,0.8144266605377197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,32,power_law_1.2,0.22749440670013427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,32,power_law_1.2,0.28748159408569335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,32,power_law_1.2,0.39028480052948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,32,power_law_1.2,0.5341055870056153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,32,power_law_1.2,0.8997247695922852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,32,power_law_1.2,1.2687744140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,32,power_law_1.2,1.4858624458312988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,32,power_law_1.2,2.749017524719238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,32,power_law_1.2,5.668620681762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,32,power_law_1.2,0.0435263991355896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,32,power_law_1.2,0.02971520125865936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,32,balanced,1.6131733258565266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,32,power_law_1.2,0.0341376006603241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,32,power_law_1.2,0.03882879912853241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,16,balanced,0.03324799984693527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,32,power_law_1.2,0.039827200770378116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,16,balanced,0.03506666670242945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,16,balanced,0.033189333975315094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,32,power_law_1.2,0.046374401450157164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,16,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,16,balanced,0.03372266640265783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,32,power_law_1.2,0.0463808000087738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,16,balanced,0.03754133234421412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,16,balanced,0.03740799923737844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,32,power_law_1.2,0.05114240050315857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,16,balanced,0.04811733464399973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,16,balanced,0.05217599868774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,32,power_law_1.2,0.05204480290412903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,16,balanced,0.05369600156943003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,16,balanced,0.06761600077152252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,16,balanced,0.053914666175842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,16,balanced,0.06264000137646993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,32,power_law_1.2,0.05491840243339539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,16,balanced,0.05382933219273885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,16,balanced,0.06344533463319142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,32,power_law_1.2,0.0580735981464386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,16,balanced,0.05429333448410034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,16,balanced,0.06699199974536896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,32,power_law_1.2,0.06251519918441772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,16,balanced,0.06753600140412648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,16,balanced,0.055029332637786865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,32,power_law_1.2,0.06142079830169678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,16,balanced,0.06750399867693584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,16,balanced,0.055786664287249245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,32,power_law_1.2,0.07340800166130065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,16,balanced,0.06875200072924297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,16,balanced,0.056101332108179726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,16,balanced,0.06925866504510243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,16,balanced,0.05649066468079885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,32,power_law_1.2,0.07793279886245727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,16,balanced,0.07027733325958252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,16,balanced,0.05789333085219065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,32,power_law_1.2,0.08150399923324585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,16,balanced,0.07256000240643819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,16,balanced,0.0626986672480901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,16,balanced,0.07633066674073537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,16,balanced,0.06337066491444905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,16,balanced,0.0772213339805603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,16,balanced,0.06594133377075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,32,power_law_1.2,0.08550400137901307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,16,balanced,0.07865599791208903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,32,power_law_1.2,0.10535039901733398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,16,balanced,0.07154666880766551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,16,balanced,0.08133866886297862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,32,power_law_1.2,0.12098560333251954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,16,balanced,0.07613866527875264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,16,balanced,0.0863146682580312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,16,balanced,0.08561600248018901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,32,power_law_1.2,0.19682559967041016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,16,balanced,0.09239466985066731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,16,balanced,0.0957973301410675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,32,power_law_1.2,0.2009216070175171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,16,balanced,0.1079253355662028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,32,power_law_1.2,0.3180927991867065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,16,balanced,0.12460266550381978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,32,power_law_1.2,0.4519552230834961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,16,balanced,0.1251626710096995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,32,power_law_1.2,0.7137792110443115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,16,balanced,0.027802666028340656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,16,balanced,0.1400320033232371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,16,power_law_1.01,0.06461439728736877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,32,power_law_1.2,0.9400447845458985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,16,balanced,0.027914665639400482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,16,balanced,0.02920000006755193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,16,power_law_1.01,0.05516800284385681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,16,balanced,0.12965866923332214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,16,balanced,0.032645332316557564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,32,power_law_1.2,1.3006015777587892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,16,power_law_1.01,0.043296000361442565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,16,balanced,0.04791999856630961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,16,balanced,0.20152533054351807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,32,power_law_1.2,1.6452928543090821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,16,power_law_1.01,0.049446401000022885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,16,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,16,balanced,0.04887466629346212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,16,power_law_1.01,0.05847679972648621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,32,power_law_1.2,2.498188781738281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,16,balanced,0.1921173334121704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,16,balanced,0.04868799944718679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,16,power_law_1.01,0.06152960062026978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,16,balanced,0.049770668148994446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,32,power_law_1.2,4.369670486450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,16,power_law_1.01,0.06293119788169861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,16,balanced,0.04996266464392344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,16,balanced,0.24059200286865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,16,power_law_1.01,0.06595199704170226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,16,balanced,0.05109866460164388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,32,power_law_1.2,10.675129699707032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,16,power_law_1.01,0.06871680021286011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,16,balanced,0.21607999006907144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,16,balanced,0.051514665285746254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,16,power_law_1.01,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,16,balanced,0.052560001611709595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,16,balanced,0.053823997577031456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,16,power_law_1.01,0.07406079769134521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,16,power_law_1.01,0.08165760040283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,16,power_law_1.01,0.0775871992111206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,16,balanced,0.3458346525828044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,16,power_law_1.01,0.08199040293693542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,16,power_law_1.01,0.08900480270385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,16,power_law_1.01,0.049158400297164916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,16,balanced,0.3048906723658244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,16,balanced,0.05898133416970571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,16,power_law_1.01,0.09251840114593506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,16,power_law_1.01,0.0400191992521286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,16,power_law_1.01,0.09412479996681214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,16,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,16,power_law_1.01,0.10812159776687622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,16,power_law_1.01,0.03441280126571655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,16,power_law_1.01,0.1250432014465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,16,power_law_1.01,0.039027199149131775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,16,power_law_1.01,0.14062080383300782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,16,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,16,power_law_1.01,0.05141119956970215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,16,power_law_1.01,0.19453439712524415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,16,balanced,0.430458664894104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,16,power_law_1.01,0.05226879715919495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,16,power_law_1.01,0.24669439792633058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,16,power_law_1.01,0.05278720259666443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,16,power_law_1.01,0.22666239738464355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,16,power_law_1.01,0.05310080051422119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,16,balanced,0.06413866579532623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,16,balanced,0.3596266508102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,16,power_law_1.01,0.311244797706604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,16,power_law_1.01,0.05467519760131836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,16,power_law_1.01,0.3990911960601807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,16,balanced,0.07160533467928569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,16,power_law_1.01,0.05428479909896851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,16,power_law_1.01,0.7151487827301025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,16,power_law_1.01,0.057094401121139525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,16,balanced,0.07436800003051758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,16,power_law_1.01,0.05839359760284424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,16,power_law_1.01,0.8166015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,16,power_law_1.01,0.06335999965667724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,16,power_law_1.01,0.8308735847473144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,16,power_law_1.01,0.07066879868507385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,16,power_law_1.01,1.464358425140381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,16,power_law_1.01,0.07344639897346497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,16,power_law_1.01,0.07648640275001525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,16,balanced,0.5313493410746256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,16,power_law_1.01,3.02675838470459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,16,balanced,0.09052266677220662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,16,power_law_1.01,0.08700799942016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,16,power_law_1.01,0.10163840055465698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,16,balanced,0.10050132870674133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,16,balanced,0.45106665293375653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,16,power_law_1.01,0.04663040041923523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,16,power_law_1.01,0.11662080287933349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,16,power_law_1.01,0.13974399566650392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,16,power_law_1.01,0.03548159897327423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,16,balanced,0.13476799925168356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,16,power_law_1.01,0.19678080081939697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,16,power_law_1.01,0.03116160035133362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,16,power_law_1.01,0.03727999925613403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,16,power_law_1.01,0.21692800521850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,16,balanced,0.15666133165359497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,16,power_law_1.01,0.03871360123157501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,16,power_law_1.01,0.29795839786529543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,16,power_law_1.01,0.04655359983444214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,16,power_law_1.01,0.36866559982299807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,16,power_law_1.01,0.04890879988670349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,16,power_law_1.01,0.04824959933757782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,16,power_law_1.01,0.5473728179931641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,16,balanced,0.2254613240559896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,16,power_law_1.01,0.05296639800071716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,16,power_law_1.01,0.7736767768859864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,16,power_law_1.01,0.0542527973651886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,16,power_law_1.01,0.8704192161560058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,16,power_law_1.01,0.060601598024368285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,16,balanced,0.8002080122629801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,16,power_law_1.01,0.06045439839363098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,16,power_law_1.01,1.3311552047729491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,16,balanced,0.2988319993019104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,16,power_law_1.01,0.06267520189285278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,16,power_law_1.2,0.06403840184211732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,16,balanced,0.673151969909668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,16,power_law_1.01,0.0654528021812439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,16,power_law_1.01,2.78287353515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,16,power_law_1.2,0.040838399529457094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,16,power_law_1.2,0.04344959855079651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,16,power_law_1.01,0.07404800057411194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,16,power_law_1.2,0.05169919729232788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,16,power_law_1.01,0.07663360238075256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,16,power_law_1.2,0.05127040147781372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,16,power_law_1.2,0.060089600086212155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,16,power_law_1.01,0.08269439935684204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,16,power_law_1.2,0.06661120057106018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,16,balanced,0.4456746578216553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,16,power_law_1.01,0.10319360494613647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,16,power_law_1.2,0.06609920263290406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,16,power_law_1.01,0.11852799654006958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,16,power_law_1.2,0.06849920153617858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,16,power_law_1.2,0.07102720141410827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,16,power_law_1.01,0.14985599517822265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,16,power_law_1.2,0.08101760149002075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,16,power_law_1.01,0.1835968017578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,16,power_law_1.2,0.08287360072135926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,16,power_law_1.01,0.24595839977264405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,16,power_law_1.2,0.08594560027122497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,16,power_law_1.01,0.35173759460449217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,16,balanced,0.5669706662495931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,16,power_law_1.2,0.08760319948196411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,16,power_law_1.01,0.4577983856201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,16,power_law_1.2,0.09578239917755127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,16,power_law_1.01,0.5713535785675049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,16,power_law_1.2,0.10262399911880493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,16,power_law_1.2,0.10061440467834473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,16,power_law_1.01,0.9663999557495118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,16,power_law_1.2,0.1133247971534729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,16,power_law_1.2,0.12716799974441528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,16,power_law_1.01,1.1669631958007813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,16,power_law_1.2,0.1475200057029724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,16,power_law_1.01,1.8206911087036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,16,power_law_1.2,0.22398719787597657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,16,power_law_1.01,2.784185600280762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,16,power_law_1.2,0.26584959030151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,16,balanced,0.7138773600260416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,16,balanced,1.5508267084757488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,16,power_law_1.2,0.3182528018951416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,16,power_law_1.01,5.576793670654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,16,power_law_1.2,0.4445375919342041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,16,balanced,1.295525312423706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,16,power_law_1.2,0.5855616092681885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,16,power_law_1.2,0.9254655838012695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,16,power_law_1.2,1.1070079803466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,16,power_law_1.2,1.6888639450073242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,16,power_law_1.2,2.6462783813476562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,16,power_law_1.2,7.282131195068359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,16,balanced,1.122549295425415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,16,power_law_1.2,0.05198079943656921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,16,power_law_1.2,0.03743360042572021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,16,power_law_1.2,0.03449600040912628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,16,power_law_1.2,0.03839359879493713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,16,power_law_1.2,0.041606399416923526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,16,power_law_1.2,0.051123201847076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,16,power_law_1.2,0.05275520086288452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,16,power_law_1.2,0.052147197723388675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,16,power_law_1.2,0.054636800289154054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,16,power_law_1.2,0.05330560207366943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,16,power_law_1.2,0.058355200290679934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,16,power_law_1.2,0.058297598361968996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,16,power_law_1.2,0.06056960225105286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,16,balanced,2.2172160148620605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,16,power_law_1.2,0.06639360189437866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,16,power_law_1.2,0.07390720248222352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,16,power_law_1.2,0.045798400044441225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,16,power_law_1.2,0.0754751980304718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,16,power_law_1.2,0.029836800694465638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,16,power_law_1.2,0.07921919822692872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,16,power_law_1.2,0.03111039996147156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,16,power_law_1.2,0.09513599872589111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,16,power_law_1.2,0.036908799409866334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,16,power_law_1.2,0.10678399801254272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,16,power_law_1.2,0.040191999077796935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,16,power_law_1.2,0.12712960243225097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,16,power_law_1.2,0.048044800758361816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,16,power_law_1.2,0.15750399827957154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,16,power_law_1.2,0.04705280065536499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,16,power_law_1.2,0.20230400562286377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,16,power_law_1.2,0.04938240051269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,16,power_law_1.2,0.25217280387878416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,16,power_law_1.2,0.052134400606155394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,16,power_law_1.2,0.054054397344589236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,16,power_law_1.2,0.3719104051589966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,16,power_law_1.2,0.49061121940612795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,16,power_law_1.2,0.06020479798316956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,16,power_law_1.2,0.06359040141105651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,16,power_law_1.2,0.6840960025787354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,16,power_law_1.2,0.0630079984664917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,16,power_law_1.2,1.0644543647766114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,16,power_law_1.2,0.07015680074691773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,16,power_law_1.2,1.1755776405334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,16,power_law_1.2,2.057484817504883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,8,balanced,0.03271466741959254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,16,power_law_1.2,0.07667199969291687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,8,balanced,0.03549333413441976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,16,power_law_1.2,5.067193603515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,16,power_law_1.2,0.08366720080375671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,8,balanced,0.03677333394686381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,8,balanced,0.04717333118120829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,8,balanced,0.06749866902828217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,16,power_law_1.2,0.0852735996246338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,8,balanced,0.0697866678237915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,16,power_law_1.2,0.10737279653549195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,8,balanced,0.06996266543865204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,8,balanced,0.06889600058396657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,16,power_law_1.2,0.12759679555892944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,8,balanced,0.0688266654809316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,8,balanced,0.0697866678237915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,16,power_law_1.2,0.1633471965789795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,8,balanced,0.07062399884064992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,16,power_law_1.2,0.22071681022644044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,8,balanced,0.07141333321730296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,16,power_law_1.2,0.29453439712524415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,8,balanced,0.07131200035413106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,16,power_law_1.2,0.4035776138305664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,8,balanced,0.0737066666285197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,16,power_law_1.2,0.6858304023742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,8,balanced,0.07787199815114339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,8,balanced,0.0779306689898173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,16,power_law_1.2,0.8135231971740723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,8,balanced,0.08313066760698955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,16,power_law_1.2,1.1254015922546388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,8,balanced,0.0876693328221639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,16,power_law_1.2,1.7853759765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,8,balanced,0.09433066844940186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,16,power_law_1.2,2.0207040786743162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,8,balanced,0.10152000188827515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,16,power_law_1.2,4.144051361083984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,8,balanced,0.1132426659266154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,16,power_law_1.2,8.489862060546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,8,balanced,0.03257066756486893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,8,balanced,0.14537066221237183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,8,balanced,0.03348266581694285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,8,power_law_1.01,0.04711039960384369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,8,balanced,0.03363200028737386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,8,power_law_1.01,0.04809600114822388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,8,balanced,0.15550933281580606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,8,balanced,0.03878933439652125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,8,power_law_1.01,0.040761598944664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,8,balanced,0.05392533540725708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,8,power_law_1.01,0.0523904025554657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,8,balanced,0.05484800040721893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,8,power_law_1.01,0.0383103996515274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,8,balanced,0.23017066717147827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,8,power_law_1.01,0.050406402349472045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,8,balanced,0.055104002356529236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,8,balanced,0.028442665934562683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,8,power_law_1.01,0.06437119841575623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,8,power_law_1.01,0.03901439905166626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,8,balanced,0.05529066423575083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,8,balanced,0.029792000850041706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,8,power_law_1.01,0.0659775972366333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,8,balanced,0.05557866891225179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,8,power_law_1.01,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,8,balanced,0.03028800090154012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,8,balanced,0.035605333745479584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,8,power_law_1.01,0.06661120057106018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,8,power_law_1.01,0.040556800365447995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,8,balanced,0.056159997979799904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,8,balanced,0.04986133178075155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,8,balanced,0.26977600653966266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,8,balanced,0.05102399984995524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,8,balanced,0.05725333094596863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,8,power_law_1.01,0.04325760006904602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,8,power_law_1.01,0.06875519752502442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,8,balanced,0.051594664653142296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,8,balanced,0.057706668972969055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,8,power_law_1.01,0.051020801067352295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,8,power_law_1.01,0.07200000286102295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,8,balanced,0.052229334910710655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,8,balanced,0.052389333645502724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,8,balanced,0.058517331878344216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,8,power_law_1.01,0.05243520140647888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,8,power_law_1.01,0.07352960109710693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,8,balanced,0.05323733389377594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,8,balanced,0.060346667965253196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,8,power_law_1.01,0.07697920203208923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,8,power_law_1.01,0.054041600227355956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,8,balanced,0.055071999629338585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,8,balanced,0.05625600119431814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,8,power_law_1.01,0.0780672013759613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,8,balanced,0.06573866804440816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,8,power_law_1.01,0.05514240264892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,8,balanced,0.05818133552869161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,8,balanced,0.3962666591008504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,8,power_law_1.01,0.08238720297813415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,8,power_law_1.01,0.053235197067260744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,8,balanced,0.06669866542021434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,8,balanced,0.05881600081920624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,8,power_law_1.01,0.0898688018321991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,8,power_law_1.01,0.05797759890556335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,8,balanced,0.0705813318490982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,8,power_law_1.01,0.09160959720611572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,8,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,8,balanced,0.07843733330567677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,8,power_law_1.01,0.09607679843902588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,8,power_law_1.01,0.06665599942207337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,8,balanced,0.08458667000134786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,8,balanced,0.06637333333492279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,8,power_law_1.01,0.10718079805374145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,8,power_law_1.01,0.06401280164718628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,8,balanced,0.06649599969387054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,8,balanced,0.09475200374921162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,8,power_law_1.01,0.07297919988632202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,8,power_law_1.01,0.1224511981010437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,8,power_law_1.01,0.14131840467453002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,8,power_law_1.01,0.07694079875946044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,8,balanced,0.47520001729329425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,8,balanced,0.10875200231870015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,8,power_law_1.01,0.1680575966835022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,8,power_law_1.01,0.08531200289726257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,8,power_law_1.01,0.21463680267333984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,8,power_law_1.01,0.0934656023979187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,8,balanced,0.14567466576894125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,8,balanced,0.07632533212502797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,8,power_law_1.01,0.23767681121826173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,8,power_law_1.01,0.10206079483032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,8,balanced,0.08764266967773438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,8,power_law_1.01,0.12186880111694336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,8,power_law_1.01,0.31924479007720946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,8,balanced,0.1663093368212382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,8,balanced,0.09136533737182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,8,power_law_1.01,0.14789119958877564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,8,power_law_1.01,0.4437119960784912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,8,power_law_1.01,0.2105407953262329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,8,power_law_1.01,0.5148608207702636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,8,power_law_1.01,0.2257024049758911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,8,power_law_1.01,0.8005696296691894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,8,balanced,0.24444266160329184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,8,balanced,0.5965173244476318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,8,power_law_1.01,0.3450239896774292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,8,balanced,0.11582400401433308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,8,power_law_1.01,0.9817791938781738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,8,power_law_1.01,0.4082047939300537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,8,power_law_1.01,1.612268829345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,8,balanced,0.13090133666992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,8,power_law_1.01,0.6142079830169678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,8,power_law_1.01,0.8252799987792969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,8,power_law_1.01,3.086675262451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,8,balanced,0.1949653426806132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,8,balanced,0.2967573404312134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,8,power_law_1.01,1.0267647743225097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,8,power_law_1.01,0.036371201276779175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,8,balanced,0.2441920042037964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,8,power_law_1.01,0.03500159978866577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,8,power_law_1.01,1.5566143989562988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,8,power_law_1.01,0.03253760039806366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,8,power_law_1.01,3.5233535766601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,8,power_law_1.01,0.03938559889793396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,8,balanced,0.3527093331019084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,8,balanced,0.43298665682474774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,8,power_law_1.01,0.04213759899139404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,8,power_law_1.01,0.04986239969730377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,8,power_law_1.01,0.05170559883117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,8,balanced,0.4535626570383708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,8,power_law_1.01,0.053830397129058835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,8,balanced,0.8778346379597982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,8,power_law_1.01,0.05483520030975342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,8,power_law_1.01,0.057145601511001586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,8,power_law_1.01,0.061913597583770755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,8,balanced,0.547599991162618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,8,power_law_1.01,0.06622719764709473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,8,balanced,0.6680106321970621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,8,power_law_1.01,0.06643840074539184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,8,power_law_1.01,0.07491199970245362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,8,power_law_1.01,0.0851967990398407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,8,power_law_1.01,0.08630399703979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,8,power_law_1.2,0.04752640128135681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,8,balanced,0.8662506739298502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,8,balanced,0.6867626508076986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,8,power_law_1.2,0.03906559944152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,8,power_law_1.2,0.03986560106277466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,8,power_law_1.01,0.09464319944381713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,8,power_law_1.2,0.045587199926376346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,8,power_law_1.01,0.10764800310134888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,8,power_law_1.2,0.05304960012435913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,8,power_law_1.2,0.06548479795455933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,8,power_law_1.01,0.13741439580917358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,8,power_law_1.2,0.066348797082901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,8,power_law_1.2,0.06851199865341187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,8,power_law_1.01,0.15948159694671632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,8,power_law_1.2,0.06869120001792908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,8,power_law_1.01,0.20881280899047852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,8,power_law_1.2,0.07300480008125305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,8,balanced,1.0810986359914143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,8,power_law_1.2,0.07591040134429931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,8,power_law_1.01,0.33183999061584474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,8,power_law_1.2,0.07790719866752624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,8,power_law_1.01,0.3763904094696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,8,power_law_1.2,0.08049280047416688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,8,power_law_1.2,0.08097280263900757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,8,power_law_1.01,0.5381311893463134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,8,power_law_1.2,0.09231359958648681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,8,balanced,1.028165340423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,8,power_law_1.01,0.8365056037902832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,8,power_law_1.2,0.09635199904441834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,8,power_law_1.2,0.09985920190811157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,8,power_law_1.01,1.0900992393493651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,8,balanced,1.7067467371622722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,8,power_law_1.2,0.11207679510116578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,8,power_law_1.01,1.4218624114990235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,8,power_law_1.2,0.12919679880142212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,8,power_law_1.01,1.9305408477783204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,8,power_law_1.2,0.1447424054145813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,8,power_law_1.2,0.18521599769592284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,8,power_law_1.01,2.62728328704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,8,power_law_1.2,0.23868160247802733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,8,balanced,1.7070666948954265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,8,power_law_1.2,0.25706241130828855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,8,power_law_1.01,6.09436149597168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,8,power_law_1.2,0.03834879994392395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,8,power_law_1.2,0.4301119804382324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,8,power_law_1.2,0.03436799943447113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,8,power_law_1.2,0.45777277946472167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,8,power_law_1.2,0.034143999218940735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,8,power_law_1.2,0.7494143962860107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,8,power_law_1.2,0.0401856005191803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,8,power_law_1.2,0.970400047302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,8,power_law_1.2,0.04147840142250061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,8,power_law_1.2,1.287929630279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,8,power_law_1.2,0.05148800015449524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,8,power_law_1.2,2.7733760833740235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,8,power_law_1.2,0.054054397344589236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,8,power_law_1.2,0.05379199981689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,8,power_law_1.2,3.708563232421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,8,power_law_1.2,0.05454080104827881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,8,power_law_1.2,0.05666559934616089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,8,power_law_1.2,0.05851519703865051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,8,power_law_1.2,0.0649728000164032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,8,power_law_1.2,0.07009919881820678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,8,power_law_1.2,0.06736000180244446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,8,balanced,2.001413345336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,8,power_law_1.2,0.07517439723014832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,8,power_law_1.2,0.07714560031890869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,8,power_law_1.2,0.08687360286712646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,8,power_law_1.2,0.09428480267524719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,8,power_law_1.2,0.11013120412826538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,8,power_law_1.2,0.13288320302963258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,8,balanced,3.3701279958089194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,8,power_law_1.2,0.15635839700698853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,8,power_law_1.2,0.22973439693450928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,8,power_law_1.2,0.25902719497680665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,8,power_law_1.2,0.3571968078613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,8,power_law_1.2,0.5149119853973388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,8,power_law_1.2,0.7580863952636718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,8,power_law_1.2,1.0471360206604003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,8,power_law_1.2,1.304652786254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,8,power_law_1.2,1.9939456939697267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,8,power_law_1.2,4.506860733032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,4,balanced,0.03571200122435888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,4,balanced,0.0373279998699824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,4,balanced,0.04001600046952566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,4,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,4,balanced,0.07000533243020375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,8,power_law_1.2,0.03648639917373657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,4,balanced,0.07157333195209503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,8,power_law_1.2,0.032364800572395325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,4,balanced,0.07167466481526692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,8,power_law_1.2,0.034892800450325015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,4,balanced,0.07233066856861115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,8,power_law_1.2,0.03824639916419983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,4,balanced,0.07208000123500824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,4,balanced,0.07348800202210744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,8,power_law_1.2,0.040838399529457094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,4,balanced,0.07411199808120728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,8,power_law_1.2,0.05121920108795166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,4,balanced,0.07576000193754832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,8,power_law_1.2,0.052160000801086424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,4,balanced,0.07850133379300435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,8,power_law_1.2,0.05389440059661865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,4,balanced,0.07785066465536754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,8,power_law_1.2,0.05490559935569763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,8,power_law_1.2,0.05909759998321533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,4,balanced,0.08515733480453491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,8,power_law_1.2,0.06175360083580017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,4,balanced,0.08690133690834045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,8,power_law_1.2,0.06815360188484192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,4,balanced,0.09427733222643535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,8,power_law_1.2,0.06821759939193725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,4,balanced,0.10241599877675374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,8,power_law_1.2,0.07835519909858704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,4,balanced,0.10723732908566792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,8,power_law_1.2,0.0821951985359192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,4,balanced,0.1225386659304301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,8,power_law_1.2,0.08885120153427124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,4,balanced,0.13740266362826029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,8,power_law_1.2,0.09528319835662842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,4,balanced,0.18581867218017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,8,power_law_1.2,0.11813119649887086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,8,power_law_1.2,0.14172159433364867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,4,balanced,0.21708800395329794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,8,power_law_1.2,0.1775871992111206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,8,power_law_1.2,0.24031999111175537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,8,power_law_1.2,0.32911360263824463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,4,balanced,0.3030986587206523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,8,power_law_1.2,0.45212159156799314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,4,balanced,0.03281066566705704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,8,power_law_1.2,0.6182655811309814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,4,balanced,0.03346133232116699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,8,power_law_1.2,0.9126655578613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,4,balanced,0.035349334279696144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,4,balanced,0.38386666774749756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,4,balanced,0.04233600199222565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,8,power_law_1.2,1.7510335922241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,4,balanced,0.0591786652803421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,8,power_law_1.2,2.2333311080932616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,4,balanced,0.060085331400235496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,4,balanced,0.060032000144322716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,8,power_law_1.2,2.2400447845458986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,4,balanced,0.06081599990526835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,4,balanced,0.06121600170930227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,8,power_law_1.2,3.8735424041748048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,4,balanced,0.5633600155512491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,4,balanced,0.06189866860707601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,4,balanced,0.0621973325808843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,8,power_law_1.2,8.966796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,4,balanced,0.0639519989490509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,4,balanced,0.06589333216349284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,4,balanced,0.0677706648906072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,4,balanced,0.07436266541481018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,4,balanced,0.03396799912055334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,4,balanced,0.07575466732184093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,4,balanced,0.03541333228349686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,4,balanced,0.7009653250376383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,4,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,4,balanced,0.08358933528264363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,4,power_law_1.01,0.03930880129337311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,4,balanced,0.043194666504859924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,4,balanced,0.09377066294352214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,4,power_law_1.01,0.04225279986858368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,4,balanced,0.0588319996992747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,4,power_law_1.01,0.03860479891300202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,4,balanced,0.10213866829872131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,4,balanced,0.06006399790445963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,4,power_law_1.01,0.05056639909744263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,4,balanced,0.06125866870085398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,4,balanced,0.11815466483434041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,4,balanced,0.06165333092212677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,4,power_law_1.01,0.05552639961242676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,4,power_law_1.01,0.035795199871063235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,4,balanced,0.06274666885534923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,4,power_law_1.01,0.06838399767875672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,4,balanced,0.13337600231170654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,4,power_law_1.01,0.03528960049152374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,4,balanced,0.06398933132489522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,4,power_law_1.01,0.06631039977073669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,4,power_law_1.01,0.0363072007894516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,4,balanced,0.06593066453933716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,4,balanced,0.879040002822876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,4,power_law_1.01,0.06773120164871216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,4,power_law_1.01,0.04318720102310181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,4,balanced,0.19097065925598145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,4,balanced,0.06834133466084798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,4,power_law_1.01,0.0463808000087738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,4,power_law_1.01,0.07204480171203613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,4,power_law_1.01,0.05514240264892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,4,balanced,0.07063999772071838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,4,power_law_1.01,0.07523840069770812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,4,power_law_1.01,0.05569919943809509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,4,balanced,0.0735040009021759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,4,power_law_1.01,0.05863680243492127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,4,balanced,0.22175999482472739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,4,power_law_1.01,0.07982079982757569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,4,power_law_1.01,0.06165760159492493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,4,power_law_1.01,0.08049920201301575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,4,power_law_1.01,0.06496000289916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,4,power_law_1.01,0.08634880185127258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,4,power_law_1.01,0.0663424015045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,4,power_law_1.01,0.07164160013198853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,4,power_law_1.01,0.7916736125946044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,4,balanced,0.3333973487218221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,4,balanced,0.08549867073694865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,4,power_law_1.01,0.07537919878959656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,4,power_law_1.01,0.7944064140319824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,4,balanced,0.08667733271916707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,4,power_law_1.01,0.07593600153923034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,4,power_law_1.01,0.8038528442382813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,4,power_law_1.01,0.03787519931793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,4,power_law_1.01,0.08414080142974853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,4,power_law_1.01,0.1118016004562378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,4,power_law_1.01,0.08915200233459472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,4,power_law_1.01,0.036032000184059144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,4,power_law_1.01,0.1245568037033081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,4,balanced,0.4293653170267741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,4,power_law_1.01,0.09775360226631165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,4,power_law_1.01,0.03787519931793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,4,power_law_1.01,0.11294080018997192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,4,power_law_1.01,0.1274880051612854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,4,power_law_1.01,0.12046719789505005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,4,power_law_1.01,0.0446399986743927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,4,power_law_1.01,0.16421760320663453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,4,balanced,0.10019733508427937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,4,balanced,1.3066346645355225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,4,power_law_1.01,0.14709119796752929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,4,power_law_1.01,0.04924800097942352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,4,power_law_1.01,0.1842687964439392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,4,power_law_1.01,0.17966079711914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,4,balanced,0.11910399794578552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,4,power_law_1.01,0.058348798751831056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,4,power_law_1.01,0.23825280666351317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,4,power_law_1.01,0.22909440994262695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,4,balanced,0.1267039974530538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,4,power_law_1.01,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,4,power_law_1.01,0.28392319679260253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,4,power_law_1.01,0.28047358989715576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,4,power_law_1.01,0.3884351968765259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,4,balanced,0.6339573462804159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,4,power_law_1.01,0.061312001943588254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,4,power_law_1.01,0.41709442138671876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,4,power_law_1.01,0.5307583808898926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,4,power_law_1.01,0.06462079882621766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,4,power_law_1.01,0.7301568031311035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,4,power_law_1.01,0.4805056095123291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,4,power_law_1.01,0.06746879816055298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,4,power_law_1.01,0.9418239593505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,4,power_law_1.01,0.7099775791168212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,4,balanced,0.1776640017827352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,4,power_law_1.01,0.07169280052185059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,4,power_law_1.2,0.038771200180053714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,4,power_law_1.01,1.1862848281860352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,4,power_law_1.01,0.07612800002098083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,4,power_law_1.01,0.9759552001953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,4,power_law_1.2,0.03609600067138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,4,power_law_1.01,1.9204992294311523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,4,balanced,0.22206934293111166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,4,power_law_1.01,0.08229119777679443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,4,power_law_1.2,0.04069119989871979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,4,power_law_1.01,1.187609577178955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,4,power_law_1.01,3.8437374114990233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,4,power_law_1.01,0.0930239975452423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,4,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,4,balanced,0.8196533521016439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,4,balanced,0.33510398864746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,4,power_law_1.01,1.8093631744384766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,4,power_law_1.2,0.05440000295639038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,4,power_law_1.01,0.10146559476852417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,4,power_law_1.2,0.06776959896087646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,4,power_law_1.01,3.784473419189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,4,balanced,0.40724798043568927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,4,power_law_1.2,0.06739839911460876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,4,power_law_1.01,0.11075199842453003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,4,power_law_1.2,0.07346559762954712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,4,power_law_1.2,0.07553279995918274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,4,power_law_1.01,0.11953279972076417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,4,balanced,0.586357315381368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,4,power_law_1.2,0.07779840230941773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,4,power_law_1.01,0.14118399620056152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,4,power_law_1.2,0.08047999739646912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,4,power_law_1.01,0.165011203289032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,4,power_law_1.2,0.08369920253753663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,4,balanced,1.0236799716949463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,4,power_law_1.2,0.08850560188293458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,4,power_law_1.01,0.23071999549865724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,4,balanced,0.7609226703643799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,4,power_law_1.01,0.32441599369049073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,4,power_law_1.2,0.7823872089385986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,4,power_law_1.01,0.42542080879211425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,4,power_law_1.2,0.7984320163726807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,4,power_law_1.01,0.5229695796966553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,4,power_law_1.2,0.8065919876098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,4,balanced,2.5381973584493003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,4,power_law_1.01,0.8427328109741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,4,power_law_1.2,0.11581439971923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,4,power_law_1.01,0.9667263984680176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,4,balanced,1.1219840049743652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,4,power_law_1.2,0.12758400440216064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,4,power_law_1.01,1.51975679397583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,4,power_law_1.2,0.14177279472351073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,4,power_law_1.2,0.1643839955329895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,4,power_law_1.01,2.120716857910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,4,power_law_1.2,0.2064255952835083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,4,power_law_1.01,2.445996856689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,4,power_law_1.2,0.24177279472351074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,4,power_law_1.01,4.029996871948242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,4,power_law_1.2,0.30529279708862306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,4,balanced,1.5251839955647786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,4,balanced,1.4728585879007976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,4,power_law_1.2,0.4415872097015381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,4,power_law_1.01,7.226470184326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,4,power_law_1.2,0.5750847816467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,4,power_law_1.2,0.7503039836883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,4,power_law_1.2,1.173043155670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,4,power_law_1.2,1.2210880279541017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,4,power_law_1.2,2.1170623779296873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,4,balanced,1.8382347424825032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,4,power_law_1.2,5.330899047851562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,4,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,4,power_law_1.2,0.03370240032672882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,4,power_law_1.2,0.03760640025138855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,4,power_law_1.2,0.04154880046844482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,4,balanced,2.9129813512166343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,4,power_law_1.2,0.04436480104923248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,4,power_law_1.2,0.05516800284385681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,4,power_law_1.2,0.05800960063934326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,4,power_law_1.2,0.06097919940948486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,4,balanced,2.9848000208536782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,4,power_law_1.2,0.06328960061073304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,4,power_law_1.2,0.06704639792442321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,4,power_law_1.2,0.07032960057258605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,4,power_law_1.2,0.070278400182724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,4,power_law_1.2,0.0755840003490448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,4,power_law_1.2,0.07740799784660339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,4,power_law_1.2,0.0883840024471283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,4,power_law_1.2,0.09128959774971009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,4,power_law_1.2,0.09811840057373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,4,power_law_1.2,0.11474560499191284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,4,power_law_1.2,0.13523839712142943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,4,power_law_1.2,0.15512319803237914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,4,power_law_1.2,0.17059839963912965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,4,power_law_1.2,0.2575167894363403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,4,power_law_1.2,0.3084223985671997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,4,power_law_1.2,0.5043200016021728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,4,power_law_1.2,0.5643583774566651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,4,power_law_1.2,0.8336319923400879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,4,power_law_1.2,1.5440832138061524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,4,power_law_1.2,1.566368007659912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,4,balanced,5.770522435506185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,4,power_law_1.2,2.6469696044921873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,4,power_law_1.2,5.063961410522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,2,balanced,0.036805334190527596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,2,balanced,0.04340266684691111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,2,balanced,0.042725334564844765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,2,balanced,0.05787733197212219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,4,power_law_1.2,0.03758080005645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,2,balanced,0.08165866633256276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,2,balanced,0.08347733815511067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,4,power_law_1.2,0.03670400083065033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,2,balanced,0.08272533118724823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,4,power_law_1.2,0.0383679986000061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,2,balanced,0.08455999692281087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,4,power_law_1.2,0.043372800946235655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,2,balanced,0.08620267113049825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,4,power_law_1.2,0.04627200067043304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,2,balanced,0.08676266670227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,4,power_law_1.2,0.05922560095787048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,2,balanced,0.08866666754086812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,4,power_law_1.2,0.0627839982509613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,2,balanced,0.09071999788284302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,4,power_law_1.2,0.06394240260124207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,2,balanced,0.09186666210492452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,4,power_law_1.2,0.06606720089912414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,4,power_law_1.2,0.06800000071525573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,2,balanced,0.09489599863688152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,4,power_law_1.2,0.07371519804000855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,2,balanced,0.10124799609184265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,4,power_law_1.2,0.08025599718093872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,2,balanced,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,2,balanced,0.10371733705202739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,4,power_law_1.2,0.08514559864997864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,4,power_law_1.2,0.09233919978141784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,2,balanced,0.11573333541552226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,2,balanced,0.03542399903138479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,2,balanced,0.038959999879201256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,2,balanced,0.12968533237775168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,4,power_law_1.2,0.10629760026931763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,2,balanced,0.049125333627065025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,2,balanced,0.1463520030180613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,4,power_law_1.2,0.10789120197296143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,2,balanced,0.06937600175539653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,2,balanced,0.07047466437021892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,2,balanced,0.16895999511082968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,2,balanced,0.07129066685835521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,4,power_law_1.2,0.11651840209960937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,2,balanced,0.07111466427644093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,4,power_law_1.2,0.15251840353012086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,2,balanced,0.18794665733973184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,4,power_law_1.2,0.17984000444412232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,2,balanced,0.07348266740640004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,2,balanced,0.07401599983374278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,4,power_law_1.2,0.243340802192688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,2,balanced,0.25733333826065063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,2,balanced,0.07478400071461995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,4,power_law_1.2,0.31449599266052247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,2,balanced,0.07638933261235555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,4,power_law_1.2,0.4574848175048828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,2,balanced,0.07870399951934814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,2,balanced,0.33189332485198975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,4,power_law_1.2,0.5452288150787353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,2,balanced,0.08262399832407634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,4,power_law_1.2,0.8298815727233887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,2,balanced,0.09111467003822327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,4,power_law_1.2,1.192255973815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,2,balanced,0.09499733646710713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,2,balanced,0.5163679917653402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,4,power_law_1.2,1.9074880599975585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,2,power_law_1.01,0.042368000745773314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,2,balanced,0.10618666807810466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,4,power_law_1.2,2.207596778869629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,2,power_law_1.01,0.0414463996887207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,4,power_law_1.2,3.5081214904785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,2,balanced,0.1193386713663737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,2,power_law_1.01,0.04088320136070252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,4,power_law_1.2,4.625836944580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,2,balanced,0.13392000397046408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,2,balanced,0.6879893143971761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,2,power_law_1.01,0.05129600167274475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,4,power_law_1.2,9.970636749267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,2,power_law_1.01,0.05809919834136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,2,balanced,0.16075199842453003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,2,power_law_1.01,0.07612159848213196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,2,balanced,0.1879146695137024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,2,power_law_1.01,0.07902719974517822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,2,power_law_1.01,0.07759360074996949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,2,power_law_1.01,0.08258559703826904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,2,balanced,0.2685760060946147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,2,balanced,1.0200106302897136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,2,power_law_1.01,0.08431360125541687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,2,power_law_1.01,0.09197440147399902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,2,balanced,0.3319999972979228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,2,power_law_1.01,0.09676799774169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,2,power_law_1.01,0.10721280574798583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,2,power_law_1.01,0.11100159883499146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,2,power_law_1.01,0.12015999555587768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,2,balanced,0.5071733395258585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,2,power_law_1.01,0.1278720021247864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,2,balanced,1.3636587460835774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,2,power_law_1.01,0.12186880111694336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,2,power_law_1.01,0.15968639850616456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,2,power_law_1.01,0.195961594581604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,2,balanced,0.6776959896087646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,2,power_law_1.01,0.22174720764160155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,2,power_law_1.01,0.26236801147460936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,2,power_law_1.01,0.3205888032913208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,2,power_law_1.01,0.4126016139984131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,2,power_law_1.01,0.5681663990020752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,2,power_law_1.01,0.684716796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,2,balanced,1.0152640342712402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,2,power_law_1.01,0.03454079926013946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,2,balanced,1.707274595896403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,2,power_law_1.01,1.0714688301086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,2,power_law_1.01,0.03580160140991211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,2,power_law_1.01,1.41463041305542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,2,power_law_1.01,0.03743999898433685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,2,power_law_1.01,0.04471679925918579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,2,power_law_1.01,1.811180877685547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,2,power_law_1.01,0.048844799399375916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,2,power_law_1.01,0.06317440271377564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,2,power_law_1.01,2.76440315246582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,2,power_law_1.01,0.06516479849815368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,2,power_law_1.01,0.06888319849967957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,2,balanced,1.286240021387736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,2,power_law_1.01,6.294918441772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,2,power_law_1.01,0.07092480063438415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,2,power_law_1.01,0.07619839906692505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,2,power_law_1.01,0.0789247989654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,2,power_law_1.01,0.0840511977672577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,2,power_law_1.01,0.09048960208892823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,2,power_law_1.01,0.09281920194625855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,2,power_law_1.01,0.10156160593032837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,2,balanced,2.5050719579060874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,2,power_law_1.01,0.1074944019317627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,2,power_law_1.01,0.1192639946937561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,2,balanced,1.6191627184549968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,2,power_law_1.01,0.13521920442581176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,2,power_law_1.01,0.1602944016456604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,2,power_law_1.01,0.1922943949699402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,2,power_law_1.01,0.23991680145263672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,2,power_law_1.01,0.30643200874328613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,2,power_law_1.2,0.04216960072517395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,2,power_law_1.01,0.39228799343109133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,2,power_law_1.2,0.039647999405860904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,2,power_law_1.01,0.5723775863647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,2,power_law_1.2,0.04195840060710907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,2,power_law_1.01,0.6974912166595459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,2,power_law_1.2,0.050496000051498416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,2,power_law_1.01,1.0215871810913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,2,power_law_1.2,0.05788800120353699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,2,power_law_1.01,1.404415988922119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,2,power_law_1.2,0.07479040026664734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,2,power_law_1.01,1.6885759353637695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,2,power_law_1.2,0.07793920040130616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,2,power_law_1.2,0.08145279884338379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,2,power_law_1.01,2.834137535095215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,2,balanced,2.5401600201924643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,2,power_law_1.2,0.08484479784965515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,2,power_law_1.01,5.694918441772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,2,power_law_1.2,0.08615679740905761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,2,power_law_1.2,0.09657599925994872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,2,power_law_1.2,0.10206719636917114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,2,power_law_1.2,0.10996479988098144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,2,power_law_1.2,0.11127040386199952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,2,power_law_1.2,0.11928319931030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,2,power_law_1.2,0.12770559787750244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,2,balanced,4.963210741678874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,2,power_law_1.2,0.12626559734344484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,2,power_law_1.2,0.16963839530944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,2,power_law_1.2,0.20142080783843994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,2,power_law_1.2,0.22775039672851563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,2,power_law_1.2,0.2620352029800415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,2,power_law_1.2,0.30933759212493894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,2,power_law_1.2,0.4295040130615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,2,power_law_1.2,0.5938623905181885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,2,power_law_1.2,0.8059647560119629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,2,power_law_1.2,1.1347328186035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,2,power_law_1.2,1.561350440979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,2,power_law_1.2,1.943212890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,2,power_law_1.2,3.1557247161865236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,2,balanced,5.012293179829915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,2,power_law_1.2,0.03432320058345795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,2,power_law_1.2,6.682669067382813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,2,power_law_1.2,0.03480960130691528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,2,power_law_1.2,0.03824639916419983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,2,power_law_1.2,0.04469760060310364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,2,power_law_1.2,0.048390400409698484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,2,power_law_1.2,0.06435840129852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,2,power_law_1.2,0.06616320013999939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,2,power_law_1.2,0.06917759776115417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,2,power_law_1.2,0.07431039810180665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,2,power_law_1.2,0.07976319789886474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,2,power_law_1.2,0.08057600259780884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,2,power_law_1.2,0.09114879965782166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,2,power_law_1.2,0.0931007981300354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,2,power_law_1.2,0.09503999948501587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,2,power_law_1.2,0.1043776035308838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,2,power_law_1.2,0.10828160047531128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,2,power_law_1.2,0.12228480577468873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,2,power_law_1.2,0.1407807946205139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,2,power_law_1.2,0.16082559823989867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,2,power_law_1.2,0.1965440034866333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,2,power_law_1.2,0.24261760711669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,2,power_law_1.2,0.31702399253845215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,2,power_law_1.2,0.4189631938934326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,2,power_law_1.2,0.5853439807891846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,2,power_law_1.2,0.7668416023254394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,2,power_law_1.2,1.1660672187805177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,2,power_law_1.2,1.620262336730957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,2,power_law_1.2,1.936729621887207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,2,power_law_1.2,3.3936641693115233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,2,power_law_1.2,7.144461059570313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,1,balanced,0.03953066716591517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,1,balanced,0.04660266637802124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,1,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,1,balanced,0.07365866502126057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,1,balanced,0.10018666585286458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,1,balanced,0.10400000214576721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,1,balanced,0.10325866937637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,1,balanced,0.10473066568374634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,1,balanced,0.10575466354688008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,1,balanced,0.10785599549611409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,1,balanced,0.11083199580510457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,1,balanced,0.11440533399581909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,1,balanced,0.11750400066375732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,1,balanced,0.121370663245519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,1,balanced,0.1281013290087382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,1,balanced,0.13296533624331155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,1,balanced,0.15203733245531717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,1,balanced,0.18081067005793253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,1,balanced,0.19917333126068115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,1,balanced,0.239519993464152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,1,balanced,0.2725600004196167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,1,balanced,0.03716266651948293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,1,balanced,0.41993598143259686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,1,balanced,0.041834667325019836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,1,balanced,0.04729066789150238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,1,balanced,0.06473066906134288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,1,balanced,0.09449066718419392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,1,balanced,0.4901920159657796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,1,balanced,0.09656000137329102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,1,balanced,0.09614400068918864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,1,balanced,0.09864532947540283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,1,balanced,0.10070932904879253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,1,balanced,0.10388267040252686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,1,balanced,0.7714613278706869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,1,power_law_1.01,0.038022398948669434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,1,balanced,0.10363200306892395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,1,power_law_1.01,0.04009599983692169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,1,balanced,0.10591999689737956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,1,power_law_1.01,0.05057280063629151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,1,balanced,0.11060800155003865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,1,balanced,0.11787733435630798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,1,power_law_1.01,0.06162559986114502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,1,balanced,1.0743199984232585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,1,balanced,0.12999999523162842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,1,power_law_1.01,0.07077760100364686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,1,power_law_1.01,0.08959360122680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,1,balanced,0.13733333349227905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,1,power_law_1.01,0.09710720181465149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,1,balanced,0.16160533825556436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,1,power_law_1.01,0.09758719801902771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,1,balanced,0.1911146640777588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,1,power_law_1.01,0.10126719474792481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,1,balanced,1.6237120628356934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,1,power_law_1.01,0.10625920295715333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,1,balanced,0.20451200008392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,1,power_law_1.01,0.11456639766693115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,1,balanced,0.2554933428764343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,1,power_law_1.01,0.12145919799804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,1,power_law_1.01,0.12647680044174195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,1,balanced,0.2995893359184265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,1,power_law_1.01,0.12655999660491943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,1,power_law_1.01,0.13755520582199096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,1,power_law_1.01,0.035206401348114015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,1,power_law_1.01,0.14472960233688353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,1,balanced,0.4486080010732015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,1,power_law_1.01,0.0384768009185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,1,power_law_1.01,0.1604416012763977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,1,power_law_1.01,0.046374401450157164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,1,balanced,2.0563999811808267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,1,power_law_1.01,0.21531519889831544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,1,power_law_1.01,0.057030397653579715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,1,balanced,0.5615839958190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,1,power_law_1.01,0.2177664041519165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,1,power_law_1.01,0.0615231990814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,1,power_law_1.01,0.2888319969177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,1,power_law_1.01,0.0847104012966156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,1,power_law_1.01,0.33588480949401855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,1,power_law_1.01,0.08819839954376221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,1,power_law_1.01,0.43576960563659667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,1,balanced,0.840399980545044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,1,power_law_1.01,0.09242879748344421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,1,power_law_1.01,0.5459328174591065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,1,power_law_1.01,0.09703680276870727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,1,power_law_1.01,0.09952639937400817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,1,power_law_1.01,0.7775487899780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,1,power_law_1.01,0.11025279760360718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,1,power_law_1.01,1.0185536384582519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,1,power_law_1.01,0.11976959705352783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,1,balanced,1.1874879995981853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,1,balanced,2.575690587361654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,1,power_law_1.01,1.5328000068664551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,1,power_law_1.01,0.1263167977333069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,1,power_law_1.01,0.13096319437026976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,1,power_law_1.01,2.0060224533081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,1,power_law_1.01,0.14332159757614135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,1,power_law_1.01,2.483955192565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,1,power_law_1.01,0.15649919509887694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,1,power_law_1.01,0.17938560247421265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,1,power_law_1.01,3.9797569274902345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,1,power_law_1.01,0.2148224115371704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,1,power_law_1.01,0.2358016014099121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,1,balanced,1.827781359354655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,1,power_law_1.01,0.29240319728851316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,1,power_law_1.01,8.556224060058593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,1,power_law_1.01,0.36231040954589844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,1,power_law_1.01,0.48930559158325193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,1,power_law_1.01,0.608896017074585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,1,power_law_1.01,0.86561279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,1,power_law_1.01,1.1470784187316894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,1,balanced,2.443589369455973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,1,power_law_1.01,1.7264127731323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,1,balanced,4.008261362711589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,1,power_law_1.2,0.038124799728393555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,1,power_law_1.01,2.282111930847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,1,power_law_1.2,0.04188160002231598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,1,power_law_1.01,2.861139106750488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,1,power_law_1.2,0.049344000220298764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,1,power_law_1.01,4.463577651977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,1,power_law_1.2,0.060153597593307497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,1,power_law_1.2,0.03521920144557953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,1,power_law_1.2,0.0679423987865448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,1,power_law_1.01,9.425811004638671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,1,power_law_1.2,0.08949120044708252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,1,power_law_1.2,0.09742079973220825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,1,power_law_1.2,0.03850879967212677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,1,power_law_1.2,0.043756800889968875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,1,power_law_1.2,0.09941120147705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,1,balanced,3.0678399403889975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,1,power_law_1.2,0.05295360088348389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,1,power_law_1.2,0.10374399423599243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,1,power_law_1.2,0.10808320045471191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,1,power_law_1.2,0.05986559987068176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,1,power_law_1.2,0.11653120517730713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,1,power_law_1.2,0.0844543993473053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,1,power_law_1.2,0.12446080446243286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,1,power_law_1.2,0.1290176033973694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,1,power_law_1.2,0.08992639780044556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,1,power_law_1.2,0.12760319709777831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,1,power_law_1.2,0.09539200067520141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,1,power_law_1.2,0.13939199447631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,1,power_law_1.2,0.14620159864425658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,1,power_law_1.2,0.10071040391921997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,1,power_law_1.2,0.16293760538101196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,1,power_law_1.2,0.10378880500793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,1,power_law_1.2,0.21779839992523192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,1,power_law_1.2,0.11399040222167969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,1,power_law_1.2,0.2203968048095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,1,power_law_1.2,0.12090239524841309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,1,power_law_1.2,0.28933761119842527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,1,power_law_1.2,0.12713600397109986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,1,balanced,4.6062774658203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,1,power_law_1.2,0.13367040157318116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,1,power_law_1.2,0.3386944055557251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,1,power_law_1.2,0.14551039934158325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,1,power_law_1.2,0.4374720096588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,1,power_law_1.2,0.15863679647445678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,1,power_law_1.2,0.5481984138488769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,1,power_law_1.2,0.1824512004852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,1,power_law_1.2,0.7836031913757324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,1,power_law_1.2,0.21692159175872802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,1,power_law_1.2,0.23955199718475342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,1,power_law_1.2,1.032921600341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,1,balanced,8.412960052490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,1,power_law_1.2,0.29244160652160645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,1,power_law_1.2,1.5389056205749512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,1,power_law_1.2,0.36584959030151365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,1,power_law_1.2,2.0380992889404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,1,power_law_1.2,0.49324798583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,1,power_law_1.2,0.6113855838775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,1,power_law_1.2,2.5357696533203127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,1,power_law_1.2,0.8684032440185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,1,power_law_1.2,4.167340850830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,1,power_law_1.2,1.1571776390075683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,1,power_law_1.2,1.7386751174926758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,1,power_law_1.2,8.63232650756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,1,power_law_1.2,2.31790714263916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,1,power_law_1.2,2.8879487991333006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,1,power_law_1.2,4.658950424194336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,1,power_law_1.2,9.628217315673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,1,balanced,9.130117416381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,32,balanced,0.07486400008201599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,32,balanced,0.05618133147557577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,32,balanced,0.07041066884994507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,32,balanced,0.053301334381103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,32,balanced,0.07035199801127116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,32,balanced,0.05314666529496511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,32,balanced,0.09151466687520345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,32,balanced,0.07089599967002869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,32,balanced,0.0950986643632253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,32,balanced,0.1285760005315145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,32,balanced,0.10354133447011311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,32,balanced,0.14892266194025675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,32,balanced,0.10445333520571391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,32,balanced,0.15335466464360556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,32,balanced,0.10548800230026245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,32,balanced,0.15361066659291586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,32,balanced,0.10599467158317566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,32,balanced,0.15544533729553223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,32,balanced,0.10659733414649963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,32,balanced,0.15431466698646545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,32,balanced,0.10876267155011494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,32,balanced,0.15666133165359497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,32,balanced,0.10883200168609619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,32,balanced,0.15690132975578308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,32,balanced,0.1111253301302592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,32,balanced,0.1590559979279836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,32,balanced,0.11416533589363098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,32,balanced,0.1591200033823649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,32,balanced,0.1181066632270813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,32,balanced,0.16053332885106406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,32,balanced,0.12025599678357442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,32,balanced,0.1744746764500936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,32,balanced,0.1236799955368042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,32,balanced,0.17190400759379068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,32,balanced,0.14924266934394836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,32,balanced,0.04964800179004669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,32,balanced,0.22775999704996744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,32,balanced,0.14271466930707297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,32,balanced,0.04894400139649709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,32,balanced,0.18354666233062744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,32,balanced,0.18130133549372354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,32,balanced,0.050341332952181496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,32,balanced,0.06818666557470958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,32,balanced,0.2552693287531535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,32,balanced,0.09515733520189922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,32,balanced,0.17848533391952515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,32,balanced,0.10010133186976115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,32,balanced,0.1015786627928416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,32,balanced,0.21611199776331583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,32,balanced,0.10217600067456563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,32,balanced,0.25035732984542847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,32,balanced,0.10176533460617065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,32,power_law_1.01,0.15943039655685426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,32,balanced,0.10250666737556458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,32,balanced,0.3362506628036499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,32,balanced,0.10386133193969727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,32,power_law_1.01,0.14453760385513306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,32,balanced,0.10482666889826457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,32,power_law_1.01,0.09786239862442017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,32,balanced,0.1069493293762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,32,power_law_1.01,0.10562560558319092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,32,balanced,0.2900213400522868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,32,balanced,0.2637813289960225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,32,power_law_1.01,0.12627840042114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,32,balanced,0.10777599612871806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,32,power_law_1.01,0.14465919733047486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,32,balanced,0.11269866426785786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,32,power_law_1.01,0.15221760272979737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,32,power_law_1.01,0.14916479587554932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,32,power_law_1.01,0.15919359922409057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,32,balanced,0.4851306676864624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,32,balanced,0.40933334827423096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,32,power_law_1.01,0.1515391945838928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,32,power_law_1.01,0.165830397605896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,32,power_law_1.01,0.10240639448165893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,32,balanced,0.1165706713994344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,32,power_law_1.01,0.18222719430923462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,32,power_law_1.01,0.18510080575942994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,32,power_law_1.01,0.09574400186538697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,32,power_law_1.01,0.1770560026168823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,32,balanced,0.5145119825998942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,32,power_law_1.01,0.06442239880561829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,32,power_law_1.01,0.22142720222473145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,32,power_law_1.01,0.07678080201148987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,32,balanced,0.452730655670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,32,power_law_1.01,0.231660795211792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,32,power_law_1.01,0.08190079927444457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,32,power_law_1.01,0.25199360847473146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,32,balanced,0.11979200442632039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,32,power_law_1.01,0.09745280146598816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,32,power_law_1.01,0.34362881183624266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,32,power_law_1.01,0.10021120309829712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,32,power_law_1.01,0.2978111982345581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,32,power_law_1.01,0.10090880393981934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,32,power_law_1.01,0.38276479244232176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,32,power_law_1.01,0.10444159507751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,32,power_law_1.01,0.4095295906066895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,32,balanced,0.6297279993693033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,32,power_law_1.01,0.52291841506958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,32,power_law_1.01,0.11246720552444459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,32,power_law_1.01,0.09673600196838379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,32,power_law_1.01,0.6487679958343506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,32,power_law_1.01,0.11446399688720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,32,balanced,0.658517320950826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,32,power_law_1.01,0.982688045501709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,32,power_law_1.01,0.11805440187454223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,32,power_law_1.01,0.09463679790496826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,32,balanced,0.13063466548919678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,32,power_law_1.01,1.0459775924682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,32,power_law_1.01,0.1244096040725708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,32,power_law_1.01,0.06336640119552613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,32,power_law_1.01,1.4187968254089356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,32,balanced,0.13911466797192892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,32,power_law_1.01,0.12355200052261353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,32,power_law_1.01,0.0884607970714569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,32,power_law_1.01,1.930988883972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,32,power_law_1.2,0.15619839429855348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,32,power_law_1.01,0.13319040536880494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,32,power_law_1.01,0.08153600096702576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,32,power_law_1.01,2.255615997314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,32,power_law_1.01,0.13976320028305053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,32,power_law_1.2,0.11450879573822022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,32,power_law_1.01,0.10080000162124633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,32,balanced,0.8274933497111002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,32,power_law_1.01,4.342924880981445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,32,power_law_1.01,0.16556799411773682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,32,power_law_1.2,0.0944320023059845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,32,power_law_1.01,0.09787520170211791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,32,power_law_1.01,0.20170879364013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,32,power_law_1.2,0.09539200067520141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,32,power_law_1.01,0.09658880233764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,32,power_law_1.01,9.738674926757813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,32,balanced,0.8069760004679362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,32,power_law_1.01,0.2000256061553955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,32,power_law_1.2,0.13230079412460327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,32,power_law_1.01,0.10478719472885131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,32,balanced,0.1583573321501414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,32,power_law_1.01,0.23972480297088622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,32,power_law_1.2,0.14833920001983641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,32,power_law_1.01,0.11180800199508667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,32,power_law_1.01,0.2703295946121216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,32,power_law_1.2,0.14027520418167114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,32,power_law_1.01,0.11963520050048829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,32,balanced,0.17339199781417847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,32,power_law_1.2,0.13903360366821288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,32,power_law_1.01,0.3293247938156128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,32,power_law_1.01,0.12050559520721435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,32,power_law_1.2,0.15256320238113402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,32,power_law_1.01,0.46102399826049806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,32,power_law_1.01,0.13150080442428588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,32,balanced,0.24207999308904013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,32,balanced,0.9756106535593668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,32,power_law_1.2,0.1622015953063965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,32,power_law_1.01,0.601855993270874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,32,power_law_1.01,0.13831039667129516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,32,power_law_1.2,0.15430400371551514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,32,power_law_1.01,0.15204479694366455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,32,power_law_1.01,0.8260607719421387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,32,balanced,0.2720639904340108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,32,power_law_1.2,0.1945024013519287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,32,power_law_1.01,1.1801152229309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,32,balanced,0.9625120162963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,32,power_law_1.2,0.20987520217895508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,32,power_law_1.01,1.454854393005371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,32,power_law_1.01,0.16240639686584474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,32,power_law_1.2,0.2192768096923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,32,power_law_1.2,0.22570879459381105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,32,power_law_1.01,1.7219583511352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,32,power_law_1.2,0.2853440046310425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,32,power_law_1.01,0.17106560468673707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,32,power_law_1.01,2.6988288879394533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,32,power_law_1.2,0.27691519260406494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,32,balanced,0.37415464719136554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,32,power_law_1.2,0.41998720169067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,32,power_law_1.01,6.04189453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,32,power_law_1.2,0.3044608116149902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,32,power_law_1.01,0.19625600576400756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,32,power_law_1.2,0.4571839809417725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,32,power_law_1.01,0.2221695899963379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,32,power_law_1.2,0.46155519485473634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,32,power_law_1.2,0.10491520166397095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,32,power_law_1.2,0.6469823837280273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,32,power_law_1.2,0.070387202501297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,32,balanced,1.42905060450236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,32,balanced,0.49026668071746826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,32,power_law_1.01,0.2582207918167114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,32,power_law_1.2,0.7851200103759766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,32,power_law_1.2,0.06787840127944947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,32,power_law_1.01,0.31623680591583253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,32,power_law_1.2,0.9959487915039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,32,power_law_1.2,0.07533439993858337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,32,power_law_1.01,0.5001023769378662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,32,power_law_1.2,1.291654396057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,32,power_law_1.2,0.08279680013656616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,32,balanced,1.4609546661376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,32,power_law_1.01,0.6192255973815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,32,power_law_1.2,0.09983360171318054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,32,power_law_1.2,2.1650623321533202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,32,power_law_1.2,0.1053056001663208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,32,balanced,0.6851306756337484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,32,power_law_1.2,3.223603057861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,32,power_law_1.01,0.8219648361206054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,32,power_law_1.2,0.10551680326461792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,32,power_law_1.2,0.11205120086669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,32,power_law_1.2,3.7097919464111326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,32,power_law_1.01,1.1289919853210448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,32,power_law_1.2,0.11214079856872558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,32,power_law_1.2,0.12184959650039673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,32,power_law_1.01,1.7608320236206054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,32,power_law_1.2,7.170175933837891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,32,power_law_1.2,0.12201600074768067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,32,power_law_1.01,2.242464065551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,32,power_law_1.2,0.14060800075531005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,32,power_law_1.2,13.501510620117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,32,power_law_1.2,0.12819839715957643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,32,power_law_1.01,2.553887939453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,32,power_law_1.2,0.1430400013923645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,32,balanced,0.8963253498077393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,32,power_law_1.01,4.5943359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,32,power_law_1.2,0.15349760055541992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,32,power_law_1.2,0.17386879920959472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,32,power_law_1.01,8.392364501953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,32,power_law_1.2,0.22445440292358398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,32,power_law_1.2,0.21479039192199706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,32,power_law_1.2,0.27640318870544434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,32,power_law_1.2,0.33045120239257814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,32,power_law_1.2,0.43363199234008787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,32,balanced,1.0892746448516846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,32,power_law_1.2,0.5512639999389648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,32,power_law_1.2,0.7644415855407715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,32,power_law_1.2,1.023526382446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,32,balanced,2.8319946924845376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,32,power_law_1.2,1.576364803314209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,32,power_law_1.2,2.0194047927856444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,32,power_law_1.2,2.423628807067871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,32,balanced,2.893648147583008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,32,power_law_1.2,3.6854270935058593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,32,power_law_1.2,11.699072265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,32,balanced,1.7265226046244304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,32,balanced,3.433722813924154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,32,power_law_1.2,0.09664000272750854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,32,power_law_1.2,0.06816639900207519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,32,power_law_1.2,0.06655359864234925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,32,power_law_1.2,0.07627519965171814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,32,power_law_1.2,0.08086400032043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,32,power_law_1.2,0.09688320159912109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,32,power_law_1.2,0.09444479942321778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,32,power_law_1.2,0.09912319779396057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,32,power_law_1.2,0.10467840433120727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,32,power_law_1.2,0.11367039680480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,16,balanced,0.06509866813818614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,32,power_law_1.2,0.11773439645767211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,16,balanced,0.06361599763234456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,32,power_law_1.2,0.12377599477767945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,16,balanced,0.0632533331712087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,16,balanced,0.08941866954167683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,32,power_law_1.2,0.140665602684021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,16,balanced,0.12737066547075906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,32,power_law_1.2,0.14526720046997071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,16,balanced,0.15289599696795145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,32,power_law_1.2,0.1806656002998352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,16,balanced,0.15744533141454062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,16,balanced,0.15375999609629312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,16,balanced,0.15474133690198263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,32,power_law_1.2,0.16874239444732667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,16,balanced,0.1553759972254435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,16,balanced,0.15590399503707886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,32,power_law_1.2,0.18670079708099366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,16,balanced,0.1572480003039042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,16,balanced,0.1586133340994517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,16,balanced,0.16083199779192606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,32,power_law_1.2,0.2151616096496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,16,balanced,0.16429866353670755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,16,balanced,0.17196265856424967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,32,power_law_1.2,0.25007359981536864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,16,balanced,0.17223467429478964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,16,balanced,0.23256532351175943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,32,power_law_1.2,0.29429121017456056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,16,balanced,0.18888000647226968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,32,power_law_1.2,0.35438721179962157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,32,power_law_1.2,0.597715187072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,16,balanced,0.26180267333984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,32,power_law_1.2,0.6977856159210205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,16,balanced,0.21990400552749634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,32,power_law_1.2,1.1407615661621093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,16,balanced,0.05187733471393585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,16,balanced,0.05298133194446564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,16,balanced,0.3325120011965434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,32,power_law_1.2,1.4543999671936034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,16,balanced,0.05411200225353241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,16,balanced,0.07012266914049785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,32,power_law_1.2,2.057439994812012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,16,balanced,0.09381866455078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,16,balanced,0.30671467383702594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,32,power_law_1.2,3.3703872680664064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,16,balanced,0.10254399975140889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,16,balanced,0.1046346624692281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,32,power_law_1.2,5.608480072021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,16,balanced,0.10541866223017375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,16,balanced,0.04303466777006785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,16,power_law_1.01,0.13317760229110717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,16,balanced,0.1058026651541392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,16,balanced,0.5027146736780802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,32,power_law_1.2,6.469939422607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,16,balanced,0.04381333291530609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,16,balanced,0.1067733367284139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,16,power_law_1.01,0.1400320053100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,16,balanced,0.0487360010544459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,16,balanced,0.10847999652226765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,16,power_law_1.01,0.08766080141067505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,16,balanced,0.06913599868615468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,32,power_law_1.2,13.692684936523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,16,balanced,0.1093386709690094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,16,power_law_1.01,0.0881663978099823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,16,balanced,0.09493866562843323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,16,balanced,0.5463200012842814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,16,balanced,0.1111199955145518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,16,power_law_1.01,0.1149183988571167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,16,balanced,0.10111467043558757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,16,balanced,0.11309333642323811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,16,power_law_1.01,0.1434816002845764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,16,balanced,0.1020906666914622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,16,power_law_1.01,0.09855999946594238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,16,power_law_1.01,0.1309183955192566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,16,balanced,0.11753066380818684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,16,balanced,0.10273067156473796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,16,power_law_1.01,0.10051840543746948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,16,power_law_1.01,0.13609600067138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,16,balanced,0.1206773320833842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,16,balanced,0.10388799508412679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,16,power_law_1.01,0.05861759781837463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,16,power_law_1.01,0.14349440336227418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,16,power_law_1.01,0.09475839734077454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,16,balanced,0.10480533043543498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,16,balanced,0.12450133760770161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,16,power_law_1.01,0.07786239981651306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,16,balanced,0.6632373332977295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,16,power_law_1.01,0.1489856004714966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,16,balanced,0.10647466778755188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,16,power_law_1.01,0.095551997423172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,16,balanced,0.15822933117548624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,16,power_law_1.01,0.07871999740600585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,16,power_law_1.01,0.15930240154266356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,16,balanced,0.1065066655476888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,16,power_law_1.01,0.052108800411224364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,16,power_law_1.01,0.09658240079879761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,16,balanced,0.1476959983507792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,16,power_law_1.01,0.16026240587234497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,16,balanced,0.10883733630180359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,16,power_law_1.01,0.07516800165176392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,16,power_law_1.01,0.09986559748649597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,16,power_law_1.01,0.17159680128097535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,16,balanced,0.11065066854159038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,16,balanced,0.1912320057551066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,16,power_law_1.01,0.07760639786720276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,16,power_law_1.01,0.09918720126152039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,16,power_law_1.01,0.17098239660263062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,16,balanced,0.1156160036722819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,16,power_law_1.01,0.09448959827423095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,16,balanced,0.18770132462183634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,16,power_law_1.01,0.10042239427566528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,16,power_law_1.01,0.18206080198287963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,16,power_law_1.01,0.09871360063552856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,16,power_law_1.01,0.19751039743423462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,16,balanced,0.8757173220316569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,16,power_law_1.01,0.10554239749908448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,16,power_law_1.01,0.1021183967590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,16,balanced,0.2600586613019307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,16,power_law_1.01,0.10740480422973633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,16,power_law_1.01,0.22371840476989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,16,power_law_1.01,0.10110080242156982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,16,power_law_1.01,0.26477439403533937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,16,balanced,0.11932800213495891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,16,power_law_1.01,0.11256320476531982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,16,power_law_1.01,0.10750720500946045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,16,power_law_1.01,0.11362559795379638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,16,power_law_1.01,0.2508415937423706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,16,balanced,0.2781386574109395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,16,power_law_1.01,0.1173248052597046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,16,power_law_1.01,0.11425919532775879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,16,power_law_1.01,0.32483839988708496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,16,power_law_1.01,0.12314239740371705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,16,power_law_1.01,0.12999680042266845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,16,power_law_1.01,0.33045120239257814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,16,power_law_1.01,0.12629120349884032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,16,balanced,0.12583999832471213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,16,power_law_1.01,0.136735999584198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,16,power_law_1.01,0.1379583954811096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,16,power_law_1.01,0.45939202308654786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,16,balanced,0.4254080057144165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,16,power_law_1.01,0.14775680303573607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,16,power_law_1.01,0.15036159753799438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,16,power_law_1.01,0.5370495796203614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,16,balanced,1.03494397799174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,16,power_law_1.01,0.1783679962158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,16,power_law_1.01,0.720198392868042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,16,power_law_1.01,0.18732800483703613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,16,power_law_1.01,0.14928640127182008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,16,power_law_1.01,0.8662848472595215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,16,balanced,0.49675198396046955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,16,power_law_1.01,0.2290816068649292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,16,power_law_1.01,1.2200703620910645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,16,power_law_1.01,0.2544895887374878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,16,power_law_1.01,0.16568319797515868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,16,power_law_1.01,1.5663999557495116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,16,balanced,0.14044800400733948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,16,power_law_1.01,0.3287935972213745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,16,power_law_1.01,2.0553407669067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,16,power_law_1.01,0.42926721572875975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,16,balanced,0.15085867047309875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,16,power_law_1.01,0.18889600038528442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,16,power_law_1.2,0.13058559894561766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,16,power_law_1.01,0.5436543941497802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,16,power_law_1.01,3.09736328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,16,power_law_1.01,0.20848000049591064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,16,balanced,0.6397226651509603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,16,power_law_1.2,0.0791808009147644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,16,power_law_1.01,0.7209216117858886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,16,power_law_1.2,0.07543039917945862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,16,power_law_1.01,7.792940521240235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,16,power_law_1.01,1.020019245147705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,16,power_law_1.2,0.09585919976234436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,16,power_law_1.2,0.11047040224075318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,16,power_law_1.01,1.1953408241271972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,16,power_law_1.2,0.1318079948425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,16,power_law_1.2,0.14559999704360962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,16,power_law_1.01,1.6526527404785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,16,power_law_1.2,0.1515071988105774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,16,balanced,1.5521119435628254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,16,balanced,0.1781866749127706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,16,power_law_1.2,0.15427199602127076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,16,power_law_1.01,0.27031679153442384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,16,power_law_1.01,2.397235107421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,16,power_law_1.2,0.15345920324325563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,16,power_law_1.01,0.3295423984527588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,16,power_law_1.2,0.15599360466003417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,16,balanced,0.1980266571044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,16,balanced,0.850810686747233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,16,power_law_1.2,0.16787199974060057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,16,power_law_1.01,5.735014343261719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,16,power_law_1.01,0.44209918975830076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,16,power_law_1.2,0.1715008020401001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,16,power_law_1.01,0.5506624221801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,16,balanced,0.2797440091768901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,16,power_law_1.2,0.1772223949432373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,16,power_law_1.2,0.1982591986656189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,16,power_law_1.2,0.19322880506515502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,16,power_law_1.2,0.23681280612945557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,16,balanced,0.3304640054702759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,16,power_law_1.2,0.2930880069732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,16,power_law_1.01,0.7891583919525147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,16,power_law_1.2,0.2856064081192017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,16,power_law_1.2,0.36360960006713866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,16,power_law_1.2,0.38814079761505127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,16,power_law_1.2,0.5317440032958984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,16,balanced,0.46322667598724365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,16,power_law_1.01,1.105440044403076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,16,power_law_1.2,0.5864511966705322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,16,balanced,1.0265013376871746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,16,power_law_1.2,0.8914752006530762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,16,power_law_1.01,1.5423999786376954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,16,power_law_1.2,1.2210240364074707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,16,power_law_1.01,2.1541824340820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,16,power_law_1.2,1.8149503707885741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,16,power_law_1.2,1.996895980834961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,16,power_law_1.01,2.43753604888916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,16,balanced,0.6011519829432169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,16,power_law_1.2,3.0837631225585938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,16,power_law_1.01,4.206598281860352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,16,power_law_1.2,5.320409774780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,16,power_law_1.01,7.52258529663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,16,power_law_1.2,9.37957763671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,16,balanced,0.8378559748331705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,16,balanced,1.5556480089823406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,16,balanced,3.062272071838379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,16,balanced,1.0944053332010906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,16,balanced,1.3500800132751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,16,power_law_1.2,0.09557120203971863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,16,power_law_1.2,0.05649920105934143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,16,power_law_1.2,0.061791998147964475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,16,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,16,power_law_1.2,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,16,power_law_1.2,0.09711359739303589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,16,power_law_1.2,0.09883520007133484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,16,power_law_1.2,0.10327680110931396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,16,power_law_1.2,0.1057919979095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,16,power_law_1.2,0.10883840322494506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,16,power_law_1.2,0.10871039628982544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,16,power_law_1.2,0.1124608039855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,16,balanced,2.1290879249572754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,16,balanced,3.0682827631632485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,16,power_law_1.2,0.11982719898223877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,16,power_law_1.2,0.12101759910583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,16,power_law_1.2,0.134060800075531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,16,power_law_1.2,0.14499839544296264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,16,power_law_1.2,0.1707327961921692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,16,power_law_1.2,0.19869439601898192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,16,power_law_1.2,0.1948799967765808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,16,power_law_1.2,0.2574592113494873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,16,power_law_1.2,0.29685120582580565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,16,power_law_1.2,0.3558847904205322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,16,power_law_1.2,0.48280959129333495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,16,power_law_1.2,0.6503488063812256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,16,power_law_1.2,0.9673279762268067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,16,power_law_1.2,1.3227840423583985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,16,power_law_1.2,1.7596288681030274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,16,power_law_1.2,2.041753578186035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,16,power_law_1.2,3.5852096557617186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,16,power_law_1.2,7.849088287353515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,16,balanced,4.236997286478679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,16,power_law_1.2,0.09457280039787293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,8,balanced,0.05522666871547699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,16,power_law_1.2,0.05639680027961731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,8,balanced,0.05579733351866404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,16,power_law_1.2,0.05592319965362549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,8,balanced,0.06392000118891399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,16,power_law_1.2,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,8,balanced,0.0897173285484314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,16,power_law_1.2,0.07946239709854126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,8,balanced,0.14666133125623068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,16,power_law_1.2,0.0967296004295349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,8,balanced,0.14968533317248026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,16,power_law_1.2,0.09933440089225769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,8,balanced,0.15757866700490317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,16,power_law_1.2,0.10049279928207397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,8,balanced,0.15607466300328574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,8,balanced,0.1553439994653066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,16,power_law_1.2,0.10413440465927123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,8,balanced,0.1578879952430725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,16,power_law_1.2,0.10434559583663941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,8,balanced,0.1572053333123525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,16,power_law_1.2,0.1214784026145935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,8,balanced,0.1604106624921163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,16,power_law_1.2,0.12386560440063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,8,balanced,0.16024532914161682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,16,power_law_1.2,0.12811520099639892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,8,balanced,0.16205333669980368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,16,power_law_1.2,0.14829440116882325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,8,balanced,0.047770669062932335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,8,balanced,0.1671839952468872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,16,power_law_1.2,0.16154240369796752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,8,balanced,0.05060266455014547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,8,balanced,0.18210132916768393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,8,balanced,0.05299733579158783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,8,balanced,0.0706826647122701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,8,balanced,0.17751999696095785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,8,balanced,0.09524266918500264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,16,power_law_1.2,0.15289599895477296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,8,balanced,0.2377600073814392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,8,balanced,0.10533866286277771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,8,balanced,0.10632000366846721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,8,balanced,0.10706133643786113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,8,balanced,0.2019466757774353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,8,balanced,0.10829333464304607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,16,power_law_1.2,0.18287359476089476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,8,balanced,0.10925867160161336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,8,balanced,0.043866669138272606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,8,balanced,0.26743467648824054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,8,balanced,0.11120532949765523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,8,power_law_1.01,0.0881600022315979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,8,balanced,0.046037331223487854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,8,balanced,0.11182933052380879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,8,balanced,0.2399946649869283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,8,balanced,0.11345600088437398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,16,power_law_1.2,0.2091264009475708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,8,balanced,0.05194666484991709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,8,power_law_1.01,0.10512000322341919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,8,balanced,0.11585600177447002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,8,balanced,0.06713066498438518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,16,power_law_1.2,0.25230720043182375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,8,power_law_1.01,0.06490880250930786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,8,balanced,0.1223520040512085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,8,balanced,0.09685333569844563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,8,balanced,0.33737067381540936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,8,balanced,0.10462400317192078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,8,balanced,0.1256480018297831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,8,power_law_1.01,0.08106880187988282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,8,balanced,0.1316373348236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,16,power_law_1.2,0.31090559959411623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,8,balanced,0.10648000240325928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,8,power_law_1.01,0.09880959987640381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,8,balanced,0.1667893330256144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,8,balanced,0.35178132851918537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,8,balanced,0.10713600118954976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,16,power_law_1.2,0.3611455917358398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,8,power_law_1.01,0.1352255940437317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,8,balanced,0.10839999715487163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,8,balanced,0.15812266866366068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,16,power_law_1.2,0.545900821685791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,8,balanced,0.11001599828402202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,8,power_law_1.01,0.13260159492492676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,8,balanced,0.21155200401941934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,8,balanced,0.11162666479746501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,16,power_law_1.2,0.7243519783020019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,8,balanced,0.5579679807027181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,8,power_law_1.01,0.14238719940185546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,8,balanced,0.2097973426183065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,8,balanced,0.11312533418337505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,8,power_law_1.01,0.14802559614181518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,8,balanced,0.11629866560300191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,16,power_law_1.2,0.9833600044250488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,8,balanced,0.2860586643218994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,8,power_law_1.01,0.1529536008834839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,8,balanced,0.11924266815185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,8,power_law_1.01,0.15701760053634645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,8,balanced,0.12607999642690024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,16,power_law_1.2,1.5836288452148437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,8,balanced,0.6168053150177002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,8,balanced,0.3241386612256368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,8,power_law_1.01,0.15998079776763915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,16,power_law_1.2,2.231916809082031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,8,power_law_1.01,0.16261759996414185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,16,power_law_1.2,2.977004814147949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,8,power_law_1.01,0.17726720571517945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,8,balanced,0.4869759877522786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,8,balanced,0.13190399607022604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,16,power_law_1.2,4.039398574829102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,8,power_law_1.01,0.18547840118408204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,8,power_law_1.01,0.19372160434722902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,8,balanced,0.7589706579844157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,16,power_law_1.2,5.909260940551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,8,power_law_1.01,0.20777599811553954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,8,balanced,0.5686879952748617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,8,power_law_1.01,0.24274559020996095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,8,power_law_1.01,0.06521599888801574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,8,balanced,0.14019733667373657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,16,power_law_1.2,13.467193603515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,8,power_law_1.01,0.2488447904586792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,8,power_law_1.01,0.07576320171356202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,8,power_law_1.01,0.3181056022644043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,8,power_law_1.01,0.05249279737472534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,8,power_law_1.01,0.338483190536499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,8,power_law_1.01,0.07043840289115906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,8,power_law_1.01,0.44406399726867674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,8,balanced,1.0246133009592693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,8,balanced,0.7597013314565023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,8,power_law_1.01,0.0763647973537445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,8,balanced,0.16105600198109946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,8,power_law_1.01,0.5259520053863526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,8,power_law_1.01,0.0972927987575531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,8,power_law_1.01,0.707257604598999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,8,balanced,0.17466666301091513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,8,power_law_1.01,0.09945600032806397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,8,power_law_1.01,0.8620863914489746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,8,power_law_1.01,0.09859200119972229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,8,power_law_1.01,0.10329600572586059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,8,power_law_1.01,1.0922752380371095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,8,power_law_1.01,0.10482560396194458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,8,power_law_1.01,1.4057536125183105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,8,balanced,1.0009600321451824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,8,power_law_1.01,0.11018879413604736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,8,power_law_1.01,1.8521791458129884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,8,balanced,0.21280533075332642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,8,power_law_1.01,0.10966399908065796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,8,balanced,1.217509349187215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,8,power_law_1.01,2.653139114379883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,8,power_law_1.01,0.11845120191574096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,8,balanced,0.2515466610590617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,8,power_law_1.01,0.12224639654159546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,8,power_law_1.01,5.359020614624024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,8,power_law_1.01,0.12405760288238525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,8,balanced,0.37969064712524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,8,power_law_1.01,0.13882240056991577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,8,power_law_1.01,0.14268800020217895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,8,power_law_1.01,0.17837439775466918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,8,balanced,0.4553706645965576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,8,power_law_1.01,0.1816704034805298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,8,balanced,1.198474645614624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,8,power_law_1.01,0.22315518856048583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,8,power_law_1.01,0.26231679916381834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,8,power_law_1.01,0.32873599529266356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,8,balanced,0.6334559917449951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,8,power_law_1.01,0.4370880126953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,8,power_law_1.01,0.06964480280876159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,8,balanced,1.8383199373881023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,8,power_law_1.01,0.5699903964996338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,8,power_law_1.01,0.08642560243606567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,8,power_law_1.01,0.055315202474594115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,8,power_law_1.01,0.7259583950042725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,8,power_law_1.2,0.08394880294799804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,8,balanced,0.8335306644439697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,8,power_law_1.01,0.06988800168037415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,8,power_law_1.01,1.1019840240478516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,8,power_law_1.2,0.06656640172004699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,8,power_law_1.01,0.07726719975471497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,8,power_law_1.01,1.3884096145629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,8,power_law_1.2,0.066348797082901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,8,power_law_1.01,0.09772160053253173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,8,power_law_1.2,0.08216959834098816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,8,power_law_1.01,0.10245120525360107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,8,power_law_1.01,1.619321632385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,8,power_law_1.01,0.10184320211410522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,8,power_law_1.2,0.09704319834709167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,8,balanced,1.849199930826823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,8,power_law_1.01,2.4506431579589845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,8,power_law_1.01,0.10536960363388062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,8,balanced,1.1643359661102295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,8,power_law_1.2,0.1307968020439148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,8,power_law_1.01,0.1133952021598816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,8,power_law_1.2,0.14488960504531861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,8,power_law_1.01,5.130220794677735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,8,power_law_1.01,0.11892479658126831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,8,power_law_1.2,0.14561920166015624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,8,power_law_1.01,0.1229375958442688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,8,power_law_1.2,0.15359359979629517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,8,power_law_1.01,0.1282240033149719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,8,power_law_1.2,0.15296640396118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,8,power_law_1.01,0.14179840087890624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,8,power_law_1.2,0.16095999479293824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,8,power_law_1.01,0.15499520301818848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,8,balanced,1.549557367960612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,8,power_law_1.2,0.16368639469146729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,8,power_law_1.2,0.16881920099258424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,8,power_law_1.01,0.1560639977455139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,8,power_law_1.2,0.17503999471664428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,8,power_law_1.2,0.19308799505233765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,8,power_law_1.2,0.1959231972694397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,8,power_law_1.01,0.17285759449005128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,8,power_law_1.2,0.22425599098205568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,8,power_law_1.2,0.2632960081100464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,8,power_law_1.01,0.1991039991378784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,8,power_law_1.2,0.2571903944015503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,8,balanced,1.8985066413879395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,8,power_law_1.01,0.22979199886322021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,8,power_law_1.2,0.3243711948394775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,8,balanced,3.6566025416056314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,8,power_law_1.2,0.38842880725860596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,8,power_law_1.01,0.2993920087814331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,8,power_law_1.2,0.5105343818664551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,8,power_law_1.01,0.3676095962524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,8,power_law_1.2,0.5764480113983155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,8,power_law_1.01,0.511891222000122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,8,power_law_1.2,0.7654592037200928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,8,power_law_1.01,0.6569664001464843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,8,power_law_1.2,0.8906559944152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,8,power_law_1.2,1.3327232360839845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,8,power_law_1.01,0.9261183738708496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,8,balanced,3.6715466181437173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,8,power_law_1.2,2.0223295211791994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,8,power_law_1.01,1.1596799850463868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,8,power_law_1.01,1.7822208404541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,8,power_law_1.2,2.727097511291504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,8,power_law_1.01,2.6081600189208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,8,balanced,2.962741216023763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,8,power_law_1.2,3.4483585357666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,8,power_law_1.01,2.942393684387207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,8,power_law_1.2,8.11475830078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,8,power_law_1.01,4.3845375061035154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,8,power_law_1.01,9.952230072021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,8,power_law_1.2,0.06216319799423218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,8,power_law_1.2,0.055827200412750244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,8,power_law_1.2,0.0531391978263855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,8,power_law_1.2,0.06503679752349853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,8,power_law_1.2,0.0728767991065979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,8,power_law_1.2,0.09483519792556763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,8,power_law_1.2,0.09514240026474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,8,balanced,5.917738596598308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,8,power_law_1.2,0.10272639989852905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,8,power_law_1.2,0.10398080348968505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,8,power_law_1.2,0.10474879741668701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,8,power_law_1.2,0.11073280572891235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,8,power_law_1.2,0.11397759914398194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,8,power_law_1.2,0.11797759532928467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,8,power_law_1.2,0.12412799596786499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,8,power_law_1.2,0.13557759523391724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,8,power_law_1.2,0.13329919576644897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,8,power_law_1.2,0.06815999746322632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,8,power_law_1.2,0.154585599899292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,8,power_law_1.2,0.05546879768371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,8,power_law_1.2,0.18503040075302124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,8,power_law_1.2,0.0545087993144989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,8,power_law_1.2,0.1956544041633606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,8,power_law_1.2,0.06789119839668274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,8,power_law_1.2,0.262227201461792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,8,power_law_1.2,0.07111679911613464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,8,power_law_1.2,0.28422400951385496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,8,power_law_1.2,0.09932159781455993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,8,power_law_1.2,0.36663041114807127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,8,power_law_1.2,0.10199040174484253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,8,power_law_1.2,0.49930877685546876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,8,power_law_1.2,0.1047935962677002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,8,power_law_1.2,0.626643180847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,8,power_law_1.2,0.10542080402374268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,8,power_law_1.2,0.8278464317321778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,8,power_law_1.2,0.11232000589370728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,4,balanced,0.05259733398755392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,8,power_law_1.2,1.1570688247680665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,8,power_law_1.2,0.12128000259399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,4,balanced,0.05596800148487091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,8,power_law_1.2,1.4917568206787108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,8,power_law_1.2,0.1339840054512024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,4,balanced,0.06332266827424367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,8,power_law_1.2,0.13215999603271483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,8,power_law_1.2,1.9908607482910157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,4,balanced,0.09143466750780742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,4,balanced,0.12925333778063455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,8,power_law_1.2,0.1389631986618042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,8,power_law_1.2,3.656070327758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,4,balanced,0.15331199765205383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,8,power_law_1.2,0.1642367959022522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,4,balanced,0.1532906691233317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,8,power_law_1.2,7.037567901611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,4,balanced,0.1540426711241404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,8,power_law_1.2,0.16928000450134278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,4,balanced,0.15493333339691162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,4,balanced,0.1553759972254435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,4,balanced,0.16115199526151022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,8,power_law_1.2,0.16620800495147706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,4,balanced,0.1637279987335205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,4,balanced,0.16470932960510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,8,power_law_1.2,0.22200961112976075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,4,balanced,0.16800532738367716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,8,power_law_1.2,0.24887681007385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,4,balanced,0.17620267470677695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,4,balanced,0.1816906730333964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,8,power_law_1.2,0.3330687999725342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,4,balanced,0.18865066766738892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,8,power_law_1.2,0.42830719947814944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,4,balanced,0.2605440020561218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,8,power_law_1.2,0.5620927810668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,4,balanced,0.22604799270629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,4,balanced,0.0465280016263326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,8,power_law_1.2,0.7837440013885498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,4,balanced,0.049839998284975685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,4,balanced,0.32689066727956134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,4,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,8,power_law_1.2,1.1508671760559082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,4,balanced,0.07419200241565704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,4,balanced,0.10449066758155823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,4,balanced,0.28004799286524457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,8,power_law_1.2,1.356544017791748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,4,balanced,0.11282666524251302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,8,power_law_1.2,2.2670591354370115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,4,balanced,0.11521066228548686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,4,balanced,0.11626666784286499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,4,balanced,0.416922648747762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,8,power_law_1.2,2.9198335647583007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,4,balanced,0.11726933717727661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,4,balanced,0.11789333820343018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,8,power_law_1.2,3.359455871582031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,4,balanced,0.05013866722583771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,4,balanced,0.11982933680216472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,4,balanced,0.42130664984385174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,4,power_law_1.01,0.06541439890861511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,4,balanced,0.12261866529782613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,4,balanced,0.053632001082102455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,8,power_law_1.2,5.313894271850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,4,balanced,0.124399999777476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,4,power_law_1.01,0.0709824025630951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,4,balanced,0.057573333382606506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,4,balanced,0.12878933548927307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,4,balanced,0.07450133562088013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,4,power_law_1.01,0.0664255976676941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,4,balanced,0.13731732964515686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,8,power_law_1.2,13.150175476074219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,4,balanced,0.6812586784362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,4,balanced,0.14081066846847534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,4,balanced,0.10562666257222493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,4,power_law_1.01,0.0874176025390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,4,balanced,0.14677866299947104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,4,balanced,0.11468799908955891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,4,power_law_1.01,0.09747840166091919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,4,balanced,0.18573333819707236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,4,balanced,0.1169706682364146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,4,power_law_1.01,0.12277120351791382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,4,balanced,0.18497600158055624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,4,power_law_1.01,0.05443199872970581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,4,balanced,0.11799466609954834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,4,power_law_1.01,0.13675520420074463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,4,balanced,0.7635839780171713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,4,balanced,0.23653332392374674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,4,power_law_1.01,0.06175360083580017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,4,balanced,0.12034133076667786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,4,power_law_1.01,0.14176000356674195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,4,power_law_1.01,0.054995197057724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,4,balanced,0.12212799986203511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,4,balanced,0.24754132827123007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,4,power_law_1.01,0.14737279415130616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,4,power_law_1.01,0.06682239770889283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,4,balanced,0.12495467066764832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,4,power_law_1.01,0.14962559938430786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,4,balanced,0.3452693223953247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,4,power_law_1.01,0.07919359803199769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,4,balanced,0.12809066971143088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,4,power_law_1.01,0.15845119953155518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,4,balanced,0.13249066472053528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,4,power_law_1.01,0.103603196144104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,4,balanced,0.39824533462524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,4,power_law_1.01,0.16681599617004395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,4,balanced,1.1186933517456055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,4,balanced,0.13875733812650046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,4,power_law_1.01,0.10336639881134033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,4,power_law_1.01,0.1804095983505249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,4,balanced,0.1474293371041616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,4,power_law_1.01,0.10824960470199585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,4,power_law_1.01,0.17842559814453124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,4,power_law_1.01,0.1115839958190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,4,balanced,0.6143253246943156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,4,power_law_1.01,0.1879744052886963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,4,power_law_1.01,0.11325440406799317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,4,power_law_1.01,0.19584640264511108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,4,power_law_1.01,0.11961599588394164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,4,balanced,0.15962666273117065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,4,power_law_1.01,0.23518719673156738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,4,power_law_1.01,0.12467199563980103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,4,balanced,0.7328373591105143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,4,power_law_1.01,0.25953919887542726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,4,power_law_1.01,0.1306175947189331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,4,balanced,1.4529120127360027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,4,power_law_1.01,0.26735360622406007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,4,power_law_1.01,0.1322111964225769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,4,power_law_1.01,0.3330048084259033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,4,power_law_1.01,0.14009599685668944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,4,balanced,0.17217065890630087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,4,power_law_1.01,0.3830399990081787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,4,power_law_1.01,0.15294079780578612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,4,power_law_1.01,0.4719552040100098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,4,power_law_1.01,0.1683776021003723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,4,balanced,1.0589439868927002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,4,power_law_1.01,0.19846400022506713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,4,power_law_1.01,0.5940095901489257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,4,power_law_1.01,0.20527360439300538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,4,power_law_1.01,0.7826047897338867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,4,power_law_1.01,0.26956160068511964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,4,balanced,0.211626668771108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,4,power_law_1.01,0.972383975982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,4,balanced,1.5793066024780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,4,power_law_1.01,0.2933120012283325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,4,balanced,0.24418665965398154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,4,power_law_1.01,1.2605952262878417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,4,power_law_1.01,0.061919999122619626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,4,power_law_1.01,0.3964416027069092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,4,power_law_1.01,1.7319232940673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,4,power_law_1.01,0.06555520296096802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,4,power_law_1.01,0.5053055763244629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,4,power_law_1.01,2.186079978942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,4,balanced,1.352234681447347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,4,power_law_1.01,0.05885440111160278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,4,power_law_1.01,0.6985856056213379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,4,power_law_1.01,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,4,balanced,0.328490674495697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,4,power_law_1.01,3.2729278564453126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,4,power_law_1.01,0.8442879676818847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,4,power_law_1.01,0.08156160116195679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,4,balanced,0.38923199971516925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,4,power_law_1.01,0.1040768027305603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,4,power_law_1.01,1.2479999542236329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,4,power_law_1.01,6.533638763427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,4,power_law_1.01,0.1130687952041626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,4,power_law_1.01,1.5685952186584473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,4,balanced,0.5687573353449503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,4,power_law_1.01,0.11518080234527588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,4,power_law_1.01,2.030950355529785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,4,power_law_1.01,0.11902719736099243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,4,power_law_1.01,3.5163265228271485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,4,power_law_1.01,0.12098560333251954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,4,balanced,0.6922986507415771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,4,balanced,1.5951253573099773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,4,power_law_1.01,0.13512320518493653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,4,power_law_1.01,5.986016082763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,4,power_law_1.01,0.13774720430374146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,4,balanced,2.520400047302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,4,balanced,0.9902933438618978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,4,power_law_1.01,0.15036799907684326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,4,power_law_1.01,0.16442879438400268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,4,power_law_1.01,0.18568320274353028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,4,balanced,1.3035199642181396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,4,power_law_1.01,0.18213759660720824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,4,power_law_1.2,0.06572160124778748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,4,power_law_1.2,0.06050559878349304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,4,power_law_1.01,0.20728960037231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,4,power_law_1.2,0.06549760103225707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,4,balanced,1.8359999656677246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,4,power_law_1.2,0.07793920040130616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,4,balanced,2.4904799461364746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,4,power_law_1.01,0.24674561023712158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,4,power_law_1.2,0.09351040124893188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,4,power_law_1.01,0.29247360229492186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,4,power_law_1.2,0.12817280292510985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,4,power_law_1.2,0.13566720485687256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,4,power_law_1.01,0.40764799118041994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,4,power_law_1.2,0.13943040370941162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,4,power_law_1.01,0.4789440155029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,4,power_law_1.2,0.15004160404205322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,4,power_law_1.01,0.6818560123443603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,4,power_law_1.2,0.14885120391845702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,4,power_law_1.01,0.8542911529541015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,4,balanced,2.4454506238301597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,4,power_law_1.2,0.16263680458068847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,4,power_law_1.01,1.297811222076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,4,power_law_1.2,0.1751680016517639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,4,power_law_1.01,1.7402559280395509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,4,power_law_1.2,0.1794368028640747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,4,power_law_1.01,2.3357311248779298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,4,power_law_1.2,0.18401919603347777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,4,power_law_1.01,3.002751922607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,4,power_law_1.2,0.19216639995574952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,4,power_law_1.2,0.2024384021759033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,4,power_law_1.01,3.80450553894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,4,power_law_1.2,0.24305920600891112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,4,balanced,4.774869283040364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,4,power_law_1.01,6.4687744140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,4,balanced,3.0002772013346353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,4,power_law_1.2,0.2840768098831177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,4,power_law_1.2,0.287827205657959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,4,power_law_1.01,12.092211151123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,4,power_law_1.2,0.3782464027404785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,4,power_law_1.2,0.3878079891204834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,4,power_law_1.2,0.5080255985260009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,4,power_law_1.2,0.6698304176330566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,4,power_law_1.2,0.8578944206237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,4,power_law_1.2,1.0125247955322265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,4,balanced,4.859706560770671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,4,power_law_1.2,1.4884991645812988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,4,power_law_1.2,0.0541375994682312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,4,power_law_1.2,1.8754560470581054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,4,power_law_1.2,0.05187839865684509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,4,balanced,4.751445452372233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,4,power_law_1.2,0.05355520248413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,4,power_law_1.2,2.2910015106201174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,4,power_law_1.2,0.0668287992477417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,4,power_law_1.2,3.971104049682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,4,power_law_1.2,0.07461760044097901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,4,power_law_1.2,0.10076800584793091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,4,power_law_1.2,8.553997039794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,4,power_law_1.2,0.10491520166397095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,4,power_law_1.2,0.10803200006484985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,4,power_law_1.2,0.1125823974609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,4,power_law_1.2,0.11319040060043335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,4,power_law_1.2,0.12332799434661865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,4,power_law_1.2,0.1287935972213745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,4,power_law_1.2,0.13598719835281373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,4,power_law_1.2,0.1311743974685669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,4,power_law_1.2,0.14769920110702514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,4,power_law_1.2,0.14970879554748534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,4,power_law_1.2,0.16838400363922118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,4,power_law_1.2,0.1988927960395813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,4,power_law_1.2,0.224070405960083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,4,power_law_1.2,0.2729599952697754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,4,power_law_1.2,0.31033599376678467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,4,power_law_1.2,0.4171584129333496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,4,power_law_1.2,0.5182720184326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,4,balanced,9.442933400472006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,4,power_law_1.2,0.7769343852996826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,4,power_law_1.2,1.0831999778747559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,4,power_law_1.2,1.3681792259216308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,4,power_law_1.2,1.7009727478027343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,4,power_law_1.2,2.066745567321777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,4,power_law_1.2,0.06080639958381653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,4,power_law_1.2,3.7057918548583983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,4,power_law_1.2,0.0593280017375946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,4,power_law_1.2,0.059622400999069215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,2,balanced,0.05417599777380625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,4,power_law_1.2,7.9163330078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,4,power_law_1.2,0.06930559873580933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,2,balanced,0.061306665341059365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,2,balanced,0.07427200178305308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,4,power_law_1.2,0.07825279831886292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,2,balanced,0.10431466499964397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,4,power_law_1.2,0.1056704044342041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,2,balanced,0.1483840048313141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,4,power_law_1.2,0.10994559526443481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,2,balanced,0.17310933272043863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,4,power_law_1.2,0.11248639822006226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,2,balanced,0.17430400848388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,4,power_law_1.2,0.12220799922943115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,2,balanced,0.17818133036295572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,4,power_law_1.2,0.12145919799804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,2,balanced,0.17799466848373413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,4,power_law_1.2,0.1357375979423523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,2,balanced,0.18295466899871826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,4,power_law_1.2,0.14535679817199706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,2,balanced,0.18362667163213095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,4,power_law_1.2,0.15664639472961425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,2,balanced,0.18725866079330444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,2,balanced,0.190010666847229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,4,power_law_1.2,0.16224000453948975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,2,balanced,0.1972000002861023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,4,power_law_1.2,0.18408960103988647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,2,balanced,0.20624534289042154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,2,balanced,0.2121760050455729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,4,power_law_1.2,0.19198720455169677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,2,balanced,0.21686400969823202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,2,balanced,0.281877338886261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,2,balanced,0.274453341960907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,4,power_law_1.2,0.2058176040649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,2,balanced,0.3549333413441976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,4,power_law_1.2,0.2680896043777466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,2,balanced,0.3766453266143799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,4,power_law_1.2,0.30147199630737304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,2,balanced,0.6033173402150472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,4,power_law_1.2,0.44136319160461424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,2,balanced,0.0489279975493749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,4,power_law_1.2,0.5541183948516846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,2,balanced,0.5872106552124023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,2,balanced,0.05286933481693268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,4,power_law_1.2,0.8473471641540528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,2,balanced,0.061808000008265175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,4,power_law_1.2,0.954201602935791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,2,balanced,0.086709330479304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,2,balanced,0.11888532837231953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,4,power_law_1.2,1.2094528198242187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,2,balanced,0.9937600294748942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,2,balanced,0.14150933424631754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,4,power_law_1.2,1.7161920547485352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,2,balanced,0.14274666706720987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,2,balanced,0.1362773378690084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,4,power_law_1.2,2.700147247314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,2,balanced,0.14037866393725076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,2,power_law_1.01,0.066348797082901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,4,power_law_1.2,3.720729446411133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,2,balanced,1.0885012944539387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,2,balanced,0.14010666807492575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,2,balanced,0.06502399841944377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,2,power_law_1.01,0.0648959994316101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,2,balanced,0.141375998655955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,4,power_law_1.2,5.337260818481445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,2,balanced,0.0689333329598109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,2,power_law_1.01,0.06848639845848084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,2,balanced,0.14409599701563516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,2,balanced,0.07679999868075053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,4,power_law_1.2,6.813702392578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,2,balanced,0.1469119985898336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,2,power_law_1.01,0.08908799886703492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,2,balanced,0.09914666414260864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,2,balanced,0.1541973352432251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,2,power_law_1.01,0.11162879467010497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,2,balanced,0.13054399689038595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,2,balanced,0.1625920037428538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,2,balanced,1.6557226181030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,4,power_law_1.2,14.226451110839843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,2,power_law_1.01,0.13991039991378784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,2,balanced,0.1495733360449473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,2,balanced,0.17006933689117432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,2,power_law_1.01,0.15095679759979247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,2,balanced,0.155157337586085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,2,power_law_1.01,0.15765759944915772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,2,balanced,0.1816213329633077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,2,balanced,0.1558026671409607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,2,power_law_1.01,0.16092159748077392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,2,balanced,0.15957333644231161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,2,balanced,0.2521173357963562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,2,power_law_1.01,0.16618239879608154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,2,balanced,0.16330666343371072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,2,balanced,0.23785066604614258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,2,balanced,0.17056532700856528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,2,power_law_1.01,0.1762943983078003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,2,balanced,0.2953333258628845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,2,balanced,0.17646400133768717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,2,power_law_1.01,0.18494720458984376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,2,balanced,2.1042720476786294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,2,power_law_1.01,0.05139840245246887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,2,balanced,0.18353599309921265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,2,power_law_1.01,0.1947711944580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,2,balanced,0.32604799667994183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,2,power_law_1.01,0.05805439949035644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,2,power_law_1.01,0.20284159183502198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,2,balanced,0.19235734144846597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,2,power_law_1.01,0.056467199325561525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,2,power_law_1.01,0.23043839931488036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,2,balanced,0.2027413249015808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,2,balanced,0.4992533524831136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,2,power_law_1.01,0.0739135980606079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,2,power_law_1.01,0.24125440120697023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,2,power_law_1.01,0.08390399813652039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,2,power_law_1.01,0.2564287900924683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,2,power_law_1.01,0.11526399850845337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,2,power_law_1.01,0.3008255958557129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,2,balanced,0.5777226686477661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,2,power_law_1.01,0.12459520101547242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,2,balanced,0.22553066412607828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,2,power_law_1.01,0.33036160469055176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,2,power_law_1.01,0.12855679988861085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,2,power_law_1.01,0.13178880214691163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,2,power_law_1.01,0.38353281021118163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,2,power_law_1.01,0.13089280128479003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,2,balanced,2.404202620188395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,2,power_law_1.01,0.5051712036132813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,2,power_law_1.01,0.14046720266342164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,2,balanced,0.889893372853597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,2,power_law_1.01,0.15096960067749024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,2,power_law_1.01,0.6439551830291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,2,power_law_1.01,0.15406080484390258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,2,balanced,0.2508586645126343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,2,power_law_1.01,0.8172736167907715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,2,power_law_1.01,0.15822720527648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,2,power_law_1.01,0.17633919715881347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,2,power_law_1.01,1.0284031867980956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,2,power_law_1.01,0.18362239599227906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,2,balanced,1.0911359786987305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,2,power_law_1.01,1.2231488227844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,2,power_law_1.01,0.2055295944213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,2,power_law_1.01,0.25753600597381593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,2,power_law_1.01,1.8073728561401368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,2,power_law_1.01,0.2611840009689331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,2,balanced,0.3450293143590291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,2,power_law_1.01,2.314975929260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,2,power_law_1.01,0.33201920986175537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,2,power_law_1.01,0.380729603767395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,2,balanced,0.40318934122721356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,2,power_law_1.01,2.8922624588012695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,2,power_law_1.01,0.06525440216064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,2,power_law_1.01,0.5122687816619873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,2,balanced,1.6096800168355305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,2,power_law_1.01,0.070169597864151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,2,balanced,0.5357813437779745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,2,power_law_1.01,4.285779190063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,2,power_law_1.01,0.6240447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,2,power_law_1.01,0.07326080203056336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,2,power_law_1.01,0.908563232421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,2,power_law_1.01,0.08833919763565064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,2,balanced,0.6452800035476685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,2,power_law_1.01,8.729990386962891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,2,power_law_1.01,1.1528191566467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,2,power_law_1.01,0.10107519626617431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,2,balanced,3.7615572611490884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,2,power_law_1.01,0.13376640081405639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,2,power_law_1.01,1.652262306213379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,2,balanced,0.9535679817199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,2,power_law_1.01,0.13965439796447754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,2,power_law_1.01,2.096966361999512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,2,power_law_1.01,0.14820480346679688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,2,power_law_1.01,2.5678144454956056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,2,balanced,2.023637294769287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,2,power_law_1.01,0.15162240266799926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,2,balanced,1.1829333305358887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,2,power_law_1.01,4.150271987915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,2,power_law_1.01,0.16264959573745727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,2,power_law_1.01,0.16649600267410278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,2,power_law_1.01,8.893170928955078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,2,power_law_1.01,0.18532480001449586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,2,balanced,1.719802697499593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,2,power_law_1.2,0.06565120220184326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,2,power_law_1.01,0.19759999513626098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,2,power_law_1.2,0.05867519974708557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,2,power_law_1.01,0.21685760021209716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,2,power_law_1.2,0.06730239987373351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,2,power_law_1.01,0.24416000843048097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,2,power_law_1.2,0.08517760038375854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,2,balanced,2.2416532834370932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,2,balanced,2.3963680267333984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,2,power_law_1.2,0.10520319938659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,2,power_law_1.01,0.24469120502471925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,2,power_law_1.2,0.14295680522918702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,2,power_law_1.2,0.1536128044128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,2,power_law_1.2,0.1575744032859802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,2,power_law_1.01,0.28513920307159424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,2,power_law_1.2,0.16560640335083007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,2,balanced,3.2261012395222983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,2,power_law_1.2,0.1716480016708374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,2,power_law_1.01,0.37502079010009765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,2,power_law_1.2,0.1816704034805298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,2,power_law_1.01,0.4379007816314697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,2,power_law_1.2,0.18738559484481812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,2,power_law_1.01,0.5960959911346435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,2,power_law_1.2,0.19559040069580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,2,power_law_1.01,0.7519296169281006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,2,power_law_1.2,0.21484160423278809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,2,power_law_1.01,1.0194239616394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,2,power_law_1.2,0.23434879779815673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,2,power_law_1.01,1.3424639701843262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,2,power_law_1.2,0.24110720157623292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,2,balanced,4.284629185994466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,2,balanced,3.7856906255086265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,2,power_law_1.2,0.26369280815124513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,2,power_law_1.01,1.8704000473022462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,2,balanced,7.311285018920898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,2,power_law_1.2,0.3105792045593262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,2,power_law_1.01,2.386137580871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,2,power_law_1.2,0.3401599884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,2,power_law_1.01,3.650969696044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,2,power_law_1.2,0.41780481338500974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,2,power_law_1.01,4.998118209838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,2,power_law_1.2,0.4778560161590576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,2,power_law_1.2,0.6510528087615967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,2,power_law_1.01,6.012390518188477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,2,power_law_1.2,0.8666367530822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,2,balanced,5.243610699971517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,2,power_law_1.01,8.831161499023438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,2,power_law_1.2,1.0406911849975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,2,power_law_1.2,1.281760025024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,2,power_law_1.01,18.60377655029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,2,power_law_1.2,2.145523262023926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,2,power_law_1.2,2.3963903427124023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,2,power_law_1.2,3.03623046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,2,power_law_1.2,4.687641525268555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,2,power_law_1.2,0.0514303982257843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,2,power_law_1.2,10.437139129638672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,2,power_law_1.2,0.052249598503112796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,2,power_law_1.2,0.0580672025680542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,2,balanced,8.37710952758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,2,power_law_1.2,0.06993280053138733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,2,power_law_1.2,0.07891200184822082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,2,balanced,7.4303944905598955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,2,power_law_1.2,0.11373440027236939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,2,power_law_1.2,0.1252992033958435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,2,power_law_1.2,0.1230463981628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,2,power_law_1.2,0.13404799699783326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,2,power_law_1.2,0.13615360260009765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,2,power_law_1.2,0.14199039936065674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,2,power_law_1.2,0.14831360578536987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,2,power_law_1.2,0.15854719877243043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,2,power_law_1.2,0.1628864049911499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,2,power_law_1.2,0.1829568028450012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,2,power_law_1.2,0.19288320541381837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,2,power_law_1.2,0.20646400451660157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,2,power_law_1.2,0.2646656036376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,2,power_law_1.2,0.27340800762176515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,2,power_law_1.2,0.34840960502624513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,2,power_law_1.2,0.39894399642944334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,2,power_law_1.2,0.5251711845397949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,2,power_law_1.2,0.7342976093292236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,2,power_law_1.2,0.9561663627624511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,2,power_law_1.2,1.2699711799621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,2,power_law_1.2,1.767430305480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,2,power_law_1.2,2.256287956237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,2,balanced,16.598400115966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,2,power_law_1.2,2.9346687316894533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,2,power_law_1.2,4.7713470458984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,2,power_law_1.2,0.06520320177078247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,1,balanced,0.06593066453933716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,2,power_law_1.2,0.06940799951553345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,2,power_law_1.2,8.804512023925781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,1,balanced,0.06642666459083557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,2,power_law_1.2,0.07783679962158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,1,balanced,0.08463467160860698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,1,balanced,0.11489066481590271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,2,power_law_1.2,0.08608639836311341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,1,balanced,0.1795039971669515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,2,power_law_1.2,0.09513599872589111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,1,balanced,0.2313013275464376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,1,balanced,0.23496532440185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,2,power_law_1.2,0.13137279748916625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,1,balanced,0.22719999154408774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,1,balanced,0.2285226583480835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,2,power_law_1.2,0.1420032024383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,1,balanced,0.23530133565266928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,1,balanced,0.2342026631037394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,2,power_law_1.2,0.14781440496444703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,1,balanced,0.2396799921989441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,1,balanced,0.24353599548339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,2,power_law_1.2,0.1539072036743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,1,balanced,0.25249600410461426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,2,power_law_1.2,0.15918079614639283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,1,balanced,0.26130133867263794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,1,balanced,0.31842132409413654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,2,power_law_1.2,0.1781440019607544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,1,balanced,0.2849386731783549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,2,power_law_1.2,0.19134080410003662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,1,balanced,0.43929600715637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,2,power_law_1.2,0.19954559803009034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,1,balanced,0.3803733189900716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,2,power_law_1.2,0.21835520267486572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,2,power_law_1.2,0.24506878852844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,1,balanced,0.5026559829711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,1,balanced,0.52128533522288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,2,power_law_1.2,0.2566335916519165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,1,balanced,0.8184053103129069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,2,power_law_1.2,0.29155840873718264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,1,balanced,0.9846986929575602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,2,power_law_1.2,0.3779968023300171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,1,balanced,1.4588534037272136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,1,balanced,0.055888002117474876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,2,power_law_1.2,0.4562240123748779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,2,power_law_1.2,0.5902463912963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,1,balanced,0.05892266829808553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,1,balanced,0.07027199864387512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,2,power_law_1.2,0.7548160076141357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,1,balanced,0.09962667028109233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,1,balanced,1.826149304707845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,2,power_law_1.2,1.113913631439209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,1,balanced,0.1474240024884542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,1,balanced,0.17548267046610513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,2,power_law_1.2,1.2781951904296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,1,balanced,0.17850132783253989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,2,power_law_1.2,1.9693824768066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,1,balanced,0.17891200383504233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,2,power_law_1.2,2.475654411315918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,1,balanced,0.18268267313639322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,1,balanced,0.18504534165064493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,2,power_law_1.2,3.807027053833008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,1,balanced,2.692240079243978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,1,balanced,0.18725866079330444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,2,power_law_1.2,5.008966445922852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,1,balanced,0.19221866130828857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,1,balanced,0.1981226603190104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,2,power_law_1.2,6.4390716552734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,1,balanced,0.20915732781092325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,2,power_law_1.2,10.042092895507812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,1,balanced,0.21850667397181192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,1,balanced,0.2381653388341268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,1,balanced,3.3709065119425454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,1,balanced,0.26038400332132977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,2,power_law_1.2,23.031283569335937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,1,balanced,0.41677868366241455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,1,balanced,0.33568533261617023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,1,balanced,0.4383253256479899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,1,balanced,0.48257601261138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,1,power_law_1.01,0.06381440162658691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,1,power_law_1.01,0.05430399775505066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,1,power_law_1.01,0.06214399933815003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,1,balanced,3.9902187983194985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,1,power_law_1.01,0.055622398853302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,1,balanced,0.7859573364257812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,1,power_law_1.01,0.07597439885139465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,1,power_law_1.01,0.06658560037612915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,1,power_law_1.01,0.09359999895095825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,1,power_law_1.01,0.08324480056762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,1,balanced,0.9247519969940186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,1,power_law_1.01,0.12768640518188476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,1,power_law_1.01,0.10262399911880493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,1,power_law_1.01,0.13982080221176146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,1,power_law_1.01,0.16830079555511473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,1,power_law_1.01,0.1540544033050537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,1,power_law_1.01,0.1919487953186035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,1,power_law_1.01,0.15911680459976196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,1,power_law_1.01,0.18932479619979858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,1,balanced,1.444474697113037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,1,power_law_1.01,0.1630079984664917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,1,power_law_1.01,0.20554239749908448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,1,power_law_1.01,0.1729856014251709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,1,power_law_1.01,0.21892480850219725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,1,power_law_1.01,0.18427519798278807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,1,power_law_1.01,0.21687040328979493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,1,power_law_1.01,0.19864959716796876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,1,power_law_1.01,0.2130944013595581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,1,power_law_1.01,0.22929279804229735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,1,balanced,1.8053545951843262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,1,power_law_1.01,0.2198335886001587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,1,power_law_1.01,0.2400576114654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,1,power_law_1.01,0.23832321166992188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,1,balanced,6.365749359130859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,1,power_law_1.01,0.27267839908599856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,1,power_law_1.01,0.26141440868377686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,1,power_law_1.01,0.29368319511413576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,1,power_law_1.01,0.3038719892501831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,1,power_law_1.01,0.32616961002349854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,1,power_law_1.01,0.373523211479187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,1,power_law_1.01,0.37093119621276854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,1,power_law_1.01,0.33172481060028075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,1,balanced,2.6693814595540366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,1,power_law_1.01,0.4670720100402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,1,power_law_1.01,0.4249983787536621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,1,power_law_1.01,0.5750656127929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,1,power_law_1.01,0.4274752140045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,1,power_law_1.01,0.7563583850860596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,1,power_law_1.01,0.5310592174530029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,1,power_law_1.01,0.9641087532043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,1,power_law_1.01,0.6067584037780762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,1,power_law_1.01,1.3514112472534179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,1,power_law_1.01,0.7931583881378174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,1,power_law_1.01,1.6824895858764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,1,power_law_1.01,0.9896448135375977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,1,power_law_1.01,1.3942720413208007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,1,power_law_1.01,2.4986240386962892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,1,balanced,3.311573346455892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,1,power_law_1.01,1.7629632949829102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,1,power_law_1.2,0.06366080045700073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,1,power_law_1.01,3.2270015716552733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,1,power_law_1.01,2.5714431762695313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,1,power_law_1.2,0.060185599327087405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,1,power_law_1.01,3.992435073852539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,1,power_law_1.2,0.06989439725875854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,1,power_law_1.01,3.285715103149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,1,power_law_1.01,6.49486083984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,1,power_law_1.2,0.08950399756431579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,1,power_law_1.01,4.056185531616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,1,power_law_1.2,0.11902719736099243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,1,power_law_1.01,6.73022689819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,1,power_law_1.01,13.644908142089843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,1,power_law_1.2,0.17108479738235474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,1,power_law_1.2,0.1920192003250122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,1,balanced,4.016186714172363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,1,power_law_1.01,13.754322814941407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,1,power_law_1.2,0.2033535957336426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,1,power_law_1.2,0.21383039951324462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,1,power_law_1.2,0.22568318843841553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,1,power_law_1.2,0.22994558811187743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,1,balanced,12.78265635172526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,1,power_law_1.2,0.23917438983917236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,1,power_law_1.2,0.25350399017333985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,1,power_law_1.2,0.277894401550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,1,power_law_1.2,0.3065023899078369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,1,power_law_1.2,0.3346175909042358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,1,power_law_1.2,0.3368256092071533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,1,power_law_1.2,0.4307712078094482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,1,power_law_1.2,0.4366144180297852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,1,balanced,6.35693359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,1,power_law_1.2,0.5494336128234864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,1,power_law_1.2,0.6144063949584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,1,power_law_1.2,0.8051775932312012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,1,power_law_1.2,1.010688018798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,1,power_law_1.2,1.4326911926269532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,1,power_law_1.2,1.7984384536743163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,1,power_law_1.2,2.6146303176879884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,1,power_law_1.2,3.3563007354736327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,1,power_law_1.2,4.143494415283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,1,power_law_1.2,6.854892730712891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,1,power_law_1.2,13.952685546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,1,power_law_1.2,0.05438079833984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,1,power_law_1.2,0.054655998945236206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,1,power_law_1.2,0.06405119895935059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,1,balanced,12.564618428548178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,1,power_law_1.2,0.07962239980697632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,1,power_law_1.2,0.09374719858169556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,1,power_law_1.2,0.1397312045097351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,1,power_law_1.2,0.15162880420684816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,1,power_law_1.2,0.16389119625091553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,1,power_law_1.2,0.17457280158996583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,1,power_law_1.2,0.17863039970397948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,1,power_law_1.2,0.1931007981300354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,1,power_law_1.2,0.201964807510376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,1,power_law_1.2,0.22290558815002443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,1,power_law_1.2,0.22495360374450685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,1,power_law_1.2,0.24739201068878175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,1,power_law_1.2,0.26626560688018797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,1,power_law_1.2,0.30663039684295657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,1,power_law_1.2,0.3817728042602539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,1,power_law_1.2,0.380128002166748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,1,power_law_1.2,0.4787136077880859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,1,power_law_1.2,0.5885183811187744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,1,power_law_1.2,0.7733695983886719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,1,power_law_1.2,0.9744511604309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,1,power_law_1.2,1.3701312065124511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,1,power_law_1.2,1.7147903442382812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,1,power_law_1.2,2.5400896072387695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,1,power_law_1.2,3.295462417602539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,1,power_law_1.2,4.05269775390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,1,power_law_1.2,6.7825981140136715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,1,power_law_1.2,13.753683471679688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,32,balanced,0.11781332890192668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,32,balanced,0.18994667132695517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,32,balanced,0.11866133411725362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,32,balanced,0.18910932540893555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,32,balanced,0.12410666545232137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,32,balanced,0.18819733460744223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,32,balanced,0.2140373388926188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,32,balanced,0.3479893207550049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,32,balanced,0.3821866512298584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,32,balanced,0.6843840281168619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,32,balanced,0.7002986272176107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,32,balanced,0.9706292947133383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,32,balanced,1.2677866617838542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,32,balanced,0.9546826680501302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,32,balanced,1.8022987047831218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,32,balanced,1.0204266707102458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,32,balanced,1.87828795115153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,32,balanced,0.9431680043538412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,32,balanced,1.8987785975138347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,32,balanced,0.990447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,32,balanced,1.8377866744995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,32,balanced,1.0225599606831868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,32,balanced,1.953920046488444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,32,balanced,0.9998506704966227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,32,power_law_1.01,1.2633279800415038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,32,balanced,1.8926186561584473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,32,balanced,0.9596266746520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,32,balanced,1.8992212613423665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,32,power_law_1.01,1.8627071380615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,32,balanced,1.0316267013549805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,32,balanced,1.9132053057352703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,32,balanced,0.050160000721613564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,32,power_law_1.01,1.843609619140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,32,balanced,1.0231359799702961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,32,balanced,1.7810133298238118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,32,balanced,0.05078400174776713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,32,power_law_1.01,0.6049471855163574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,32,balanced,1.07259202003479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,32,balanced,1.9065334002176921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,32,balanced,0.05145066479841868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,32,power_law_1.01,1.0289983749389648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,32,balanced,0.9878506660461426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,32,balanced,1.78002134958903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,32,balanced,0.0683840016523997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,32,power_law_1.01,1.069267177581787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,32,balanced,0.08949866890907288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,32,balanced,1.7673600514729817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,32,balanced,0.9400533040364584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,32,power_law_1.01,1.4020544052124024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,32,balanced,0.12948266665140787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,32,balanced,1.7953972816467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,32,balanced,0.9324639638264974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,32,balanced,0.17106133699417114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,32,power_law_1.01,1.5481663703918458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,32,balanced,0.17226133743921915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,32,balanced,1.7936053276062012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,32,power_law_1.01,1.507583999633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,32,balanced,0.9543786843617758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,32,balanced,0.17285333077112833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,32,power_law_1.01,1.548851203918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,32,balanced,0.17417067289352417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,32,balanced,1.6585920651753743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,32,balanced,0.17432532707850137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,32,balanced,0.9411146640777588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,32,power_law_1.01,1.6081792831420898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,32,balanced,0.17726399501164755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,32,balanced,1.594831943511963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,32,power_law_1.01,1.4922880172729491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,32,power_law_1.01,0.7295936107635498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,32,balanced,0.17821866273880005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,32,balanced,0.8742240269978842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,32,power_law_1.01,1.6503488540649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,32,balanced,0.17940799395243326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,32,power_law_1.01,1.0144960403442382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,32,balanced,0.18701332807540894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,32,balanced,1.3758986790974934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,32,power_law_1.01,1.609107208251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,32,power_law_1.01,1.0265791893005372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,32,balanced,0.18862932920455933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,32,power_law_1.01,0.30174078941345217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,32,power_law_1.01,1.5568960189819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,32,power_law_1.01,0.48244481086730956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,32,balanced,0.6906186739603678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,32,balanced,0.19412267208099365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,32,power_law_1.01,1.6272127151489257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,32,power_law_1.01,0.5730559825897217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,32,balanced,0.9722186724344889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,32,balanced,0.20622400442759195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,32,power_law_1.01,0.5994751930236817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,32,power_law_1.01,1.6482688903808593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,32,power_law_1.01,0.7777472019195557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,32,power_law_1.01,1.4554431915283204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,32,power_law_1.01,0.8480128288269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,32,balanced,1.720314661661784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,32,power_law_1.01,0.8847743988037109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,32,power_law_1.01,1.8201343536376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,32,power_law_1.01,0.7497407913208007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,32,balanced,2.8760105768839517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,32,power_law_1.01,1.918764877319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,32,power_law_1.01,0.7913536071777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,32,balanced,0.2201333244641622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,32,power_law_1.01,1.9199359893798829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,32,power_law_1.01,0.8735424041748047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,32,power_law_1.01,0.8381183624267579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,32,power_law_1.01,2.4403007507324217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,32,power_law_1.01,0.7765312194824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,32,power_law_1.01,2.731328010559082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,32,power_law_1.01,0.9593279838562012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,32,balanced,1.2916320164998372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,32,power_law_1.01,0.8179519653320313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,32,power_law_1.01,3.374323272705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,32,balanced,1.8843520482381184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,32,power_law_1.01,0.8990976333618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,32,power_law_1.01,0.9088768005371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,32,power_law_1.01,4.209740829467774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,32,balanced,0.24593599637349448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,32,power_law_1.01,1.0623167991638183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,32,power_law_1.01,5.74835205078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,32,power_law_1.01,1.1257216453552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,32,power_law_1.01,0.14057600498199463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,32,balanced,0.26797332366307575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,32,power_law_1.01,1.2434752464294434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,32,power_law_1.01,7.287513732910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,32,power_law_1.01,1.563212776184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,32,power_law_1.01,0.17191040515899658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,32,balanced,2.2820107142130532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,32,power_law_1.01,2.034841537475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,32,balanced,0.30853867530822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,32,power_law_1.01,0.16698240041732787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,32,power_law_1.01,8.770432281494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,32,power_law_1.01,2.656051254272461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,32,power_law_1.01,0.08335360288619995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,32,balanced,3.5265814463297525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,32,power_law_1.01,3.468396759033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,32,power_law_1.01,0.10279040336608887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,32,power_law_1.01,14.920576477050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,32,power_law_1.01,4.450502395629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,32,power_law_1.01,0.11845760345458985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,32,power_law_1.01,4.9960063934326175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,32,power_law_1.01,0.12384639978408814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,32,balanced,0.36292799313863117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,32,power_law_1.01,0.13893120288848876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,32,power_law_1.01,7.498067474365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,32,power_law_1.01,31.981869506835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,32,power_law_1.01,0.15699199438095093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,32,power_law_1.01,0.1591231942176819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,32,power_law_1.01,14.201747131347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,32,balanced,3.1549011866251626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,32,power_law_1.01,0.15568000078201294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,32,balanced,0.4461919864018758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,32,power_law_1.01,0.16640000343322753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,32,balanced,5.14851729075114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,32,power_law_1.01,0.1852735996246338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,32,power_law_1.2,1.2594112396240233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,32,power_law_1.01,0.18592000007629395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,32,power_law_1.01,0.19417599439620972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,32,power_law_1.2,1.820889663696289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,32,power_law_1.01,0.21069440841674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,32,balanced,0.6241866747538248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,32,power_law_1.2,1.8486656188964843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,32,power_law_1.01,0.23685119152069092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,32,power_law_1.01,0.272492790222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,32,power_law_1.2,0.615558385848999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,32,power_law_1.2,0.9030719757080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,32,power_law_1.01,0.2835007905960083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,32,power_law_1.2,0.93306884765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,32,balanced,4.547418594360352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,32,balanced,0.8086880048116049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,32,power_law_1.2,1.0178496360778808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,32,power_law_1.2,0.7069632053375244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,32,power_law_1.01,0.3040127992630005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,32,power_law_1.2,1.350553607940674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,32,balanced,7.329850514729817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,32,power_law_1.01,0.35582718849182127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,32,power_law_1.2,1.0112000465393067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,32,power_law_1.2,1.4698047637939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,32,power_law_1.01,0.4867712020874023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,32,power_law_1.2,0.9500032424926758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,32,power_law_1.2,0.30049920082092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,32,power_law_1.2,1.4395456314086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,32,power_law_1.01,0.5444416046142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,32,power_law_1.2,0.48282880783081056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,32,power_law_1.2,1.583347225189209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,32,balanced,1.09988268216451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,32,power_law_1.01,0.7685247898101807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,32,power_law_1.2,0.558899211883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,32,power_law_1.2,1.5905535697937012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,32,power_law_1.2,0.663647985458374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,32,power_law_1.01,1.1022272109985352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,32,power_law_1.2,1.5788415908813476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,32,power_law_1.2,0.873964786529541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,32,power_law_1.01,1.4773311614990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,32,power_law_1.2,1.4168000221252441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,32,power_law_1.2,0.7922431945800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,32,power_law_1.2,0.8187456130981445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,32,power_law_1.01,1.9533248901367188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,32,power_law_1.2,1.667487907409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,32,power_law_1.2,0.8053824424743652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,32,power_law_1.2,1.4511167526245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,32,power_law_1.01,2.163257598876953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,32,power_law_1.2,0.7274943828582764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,32,balanced,1.3871359825134277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,32,power_law_1.2,1.598681640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,32,power_law_1.01,3.9991744995117187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,32,power_law_1.2,0.9308287620544433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,32,power_law_1.2,1.626950454711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,32,power_law_1.2,0.7997312068939209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,32,power_law_1.01,7.399769592285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,32,power_law_1.2,1.8069952011108399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,32,power_law_1.2,0.800716781616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,32,power_law_1.2,2.025094413757324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,32,power_law_1.2,0.8332032203674317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,32,power_law_1.2,2.2504575729370115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,32,power_law_1.2,0.8730048179626465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,32,power_law_1.2,2.8936832427978514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,32,power_law_1.2,0.8680319786071777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,32,power_law_1.2,3.285932922363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,32,balanced,7.864992141723633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,32,power_law_1.2,0.9430208206176758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,32,power_law_1.2,1.1097087860107422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,32,power_law_1.2,4.200864028930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,32,power_law_1.2,1.3515904426574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,32,balanced,12.216442108154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,32,power_law_1.2,5.351244735717773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,32,power_law_1.2,1.5210623741149902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,32,balanced,2.1629865964253745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,32,power_law_1.2,1.7194751739501952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,32,power_law_1.2,7.9372413635253904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,32,power_law_1.2,2.5567935943603515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,32,power_law_1.2,9.595801544189452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,32,power_law_1.2,2.805836868286133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,32,power_law_1.2,4.304313659667969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,32,power_law_1.2,13.138003540039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,32,power_law_1.2,6.112556838989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,32,power_law_1.2,6.711686706542968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,32,power_law_1.2,21.374490356445314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,32,power_law_1.2,12.092838287353516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,32,power_law_1.2,44.851296997070314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,32,power_law_1.2,21.900941467285158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,32,balanced,4.193269411722819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,16,balanced,0.06885333359241486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,16,balanced,0.05956799785296122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,16,balanced,0.06554666658242543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,16,balanced,0.08646933237711589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,32,power_law_1.2,0.14072320461273194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,16,balanced,0.1265120009581248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,16,balanced,0.20517865816752115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,32,power_law_1.2,0.17189760208129884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,16,balanced,0.28946133454640705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,32,power_law_1.2,0.15652480125427246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,16,balanced,0.292522668838501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,32,power_law_1.2,0.08046720027923585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,16,balanced,0.29063467184702557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,32,power_law_1.2,0.11245440244674683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,16,balanced,0.2950719992319743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,32,power_law_1.2,0.1130944013595581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,16,balanced,0.29385600487391156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,32,power_law_1.2,0.11900160312652588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,16,balanced,0.29759466648101807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,16,balanced,0.2987733284632365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,32,power_law_1.2,0.1438912034034729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,16,balanced,0.2995786666870117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,32,power_law_1.2,0.14153599739074707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,16,balanced,0.3056640028953552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,32,power_law_1.2,0.15279359817504884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,16,balanced,0.3073546687761943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,32,power_law_1.2,0.1559615969657898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,16,balanced,0.3136586745580037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,32,power_law_1.2,0.17656960487365722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,16,balanced,0.32574933767318726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,32,power_law_1.2,0.16972800493240356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,16,balanced,0.33894399801890057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,32,power_law_1.2,0.1852671980857849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,16,balanced,0.3580373525619507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,32,power_law_1.2,0.20257918834686278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,32,power_law_1.2,0.20122239589691163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,16,balanced,0.37567468484242755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,32,power_law_1.2,0.24049921035766603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,16,balanced,0.4135253429412842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,32,power_law_1.2,0.288755202293396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,16,balanced,0.45790934562683105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,32,power_law_1.2,0.32366719245910647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,32,power_law_1.2,0.3328383922576904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,16,balanced,0.5200533469518026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,32,power_law_1.2,0.41855359077453613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,32,power_law_1.2,0.5711552143096924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,16,balanced,0.6568373441696167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,16,balanced,0.04965866605440775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,32,power_law_1.2,0.6571839809417724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,16,balanced,0.05117866893609365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,32,power_law_1.2,0.9246720314025879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,16,balanced,0.052970667680104576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,16,balanced,0.06876266499360402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,16,balanced,0.08911466598510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,32,power_law_1.2,1.1926719665527343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,16,balanced,0.12986133495966592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,16,balanced,0.7916426658630371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,32,power_law_1.2,1.9193727493286132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,16,balanced,0.17188799381256104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,16,balanced,0.1734559933344523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,32,power_law_1.2,2.267500877380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,16,balanced,0.17419199148813883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,16,balanced,0.17507733901341757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,32,power_law_1.2,2.997587203979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,16,balanced,0.1766080061594645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,16,power_law_1.01,0.13038719892501832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,16,balanced,0.17844800154368082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,32,power_law_1.2,5.285107040405274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,16,balanced,0.1810986598332723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,16,power_law_1.01,0.21041278839111327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,16,balanced,0.18228266636530557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,16,balanced,1.0929546356201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,16,power_law_1.01,0.2826560020446777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,32,power_law_1.2,9.746701049804688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,16,balanced,0.19066667556762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,16,power_law_1.01,0.10264320373535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,16,balanced,0.1925599972407023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,16,power_law_1.01,0.1265663981437683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,16,balanced,0.19993066787719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,16,power_law_1.01,0.1600767970085144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,16,balanced,0.04796266555786133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,16,balanced,0.21276267369588217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,16,power_law_1.01,0.19301120042800904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,16,balanced,0.04858666658401489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,16,balanced,0.22728532552719116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,16,power_law_1.01,0.21938560009002686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,16,balanced,0.053258667389551796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,16,power_law_1.01,0.22702720165252685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,16,balanced,0.07063466807206471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,16,balanced,0.25379733244578045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,16,power_law_1.01,0.24647040367126466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,16,balanced,1.3426507314046223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,16,balanced,0.09277333815892537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,16,power_law_1.01,0.08731520175933838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,16,balanced,0.2839946746826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,16,balanced,0.1291146675745646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,16,power_law_1.01,0.23934719562530518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,16,power_law_1.01,0.13092479705810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,16,balanced,0.17250667015711466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,16,power_law_1.01,0.2569792032241821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,16,power_law_1.01,0.09290879964828491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,16,power_law_1.01,0.16392960548400878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,16,balanced,0.33266667524973553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,16,balanced,0.1731839974721273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,16,power_law_1.01,0.2591808080673218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,16,power_law_1.01,0.07215999960899352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,16,power_law_1.01,0.1341312050819397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,16,power_law_1.01,0.09006720185279846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,16,balanced,0.17409066359202066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,16,power_law_1.01,0.26195199489593507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,16,power_law_1.01,0.1730944037437439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,16,power_law_1.01,0.1139456033706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,16,balanced,0.17431465784708658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,16,balanced,0.3867786725362142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,16,power_law_1.01,0.2954432010650635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,16,power_law_1.01,0.1245311975479126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,16,power_law_1.01,0.07619839906692505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,16,balanced,0.17602666219075522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,16,power_law_1.01,0.1478335976600647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,16,power_law_1.01,0.30709760189056395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,16,power_law_1.01,0.09349759817123413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,16,balanced,0.17972799142201742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,16,power_law_1.01,0.13850879669189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,16,power_law_1.01,0.3117055892944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,16,power_law_1.01,0.11397119760513305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,16,balanced,0.18069867293039957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,16,power_law_1.01,0.1487231969833374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,16,balanced,0.4798506498336792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,16,power_law_1.01,0.15139199495315553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,16,power_law_1.01,0.12144639492034912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,16,balanced,0.18369599183400473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,16,power_law_1.01,0.3499648094177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,16,power_law_1.01,0.15178879499435424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,16,power_law_1.01,0.150873601436615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,16,balanced,0.19114667177200317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,16,power_law_1.01,0.3637439966201782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,16,power_law_1.01,0.15898239612579346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,16,power_law_1.01,0.14410879611968994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,16,power_law_1.01,0.17074559926986693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,16,balanced,0.19316265980402628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,16,power_law_1.01,0.40838398933410647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,16,balanced,1.9967947006225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,16,power_law_1.01,0.17568639516830445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,16,power_law_1.01,0.14204800128936768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,16,balanced,0.6133280197779337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,16,balanced,0.20146133502324423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,16,power_law_1.2,0.12047359943389893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,16,power_law_1.01,0.45506558418273924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,16,power_law_1.01,0.19173760414123536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,16,power_law_1.01,0.15217280387878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,16,power_law_1.01,0.19372160434722902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,16,balanced,0.21561066309611002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,16,power_law_1.01,0.5800127983093262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,16,power_law_1.2,0.21149439811706544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,16,power_law_1.01,0.1627071976661682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,16,power_law_1.01,0.21842560768127442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,16,power_law_1.01,0.6628416061401368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,16,power_law_1.2,0.2012928009033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,16,power_law_1.01,0.24142079353332518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,16,power_law_1.01,0.16123520135879515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,16,power_law_1.01,0.28307199478149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,16,power_law_1.01,0.8436223983764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,16,power_law_1.2,0.10127359628677368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,16,power_law_1.01,0.16768640279769897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,16,power_law_1.01,0.31290240287780763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,16,power_law_1.2,0.1377344012260437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,16,balanced,0.8039999802907308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,16,power_law_1.01,1.025881576538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,16,balanced,0.23678400119145712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,16,power_law_1.01,0.19543039798736572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,16,power_law_1.01,0.43797760009765624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,16,power_law_1.2,0.15781760215759277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,16,power_law_1.01,1.2848832130432128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,16,power_law_1.01,0.46030077934265134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,16,power_law_1.01,0.20222079753875732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,16,power_law_1.2,0.1505087971687317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,16,power_law_1.01,0.6464896202087402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,16,power_law_1.01,1.5881088256835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,16,power_law_1.01,0.21962239742279052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,16,power_law_1.2,0.22037758827209472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,16,power_law_1.01,0.8309439659118653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,16,power_law_1.01,0.2850303888320923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,16,power_law_1.01,1.1012351989746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,16,power_law_1.01,1.8496128082275392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,16,power_law_1.2,0.2240000009536743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,16,power_law_1.01,1.3599616050720216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,16,power_law_1.2,0.23347840309143067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,16,power_law_1.01,2.941971206665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,16,power_law_1.01,1.6644351959228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,16,balanced,1.0776267051696777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,16,power_law_1.2,0.22926080226898193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,16,power_law_1.01,0.28549120426177976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,16,balanced,0.2704480091730754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,16,power_law_1.01,2.62106876373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,16,power_law_1.01,5.873811340332031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,16,power_law_1.2,0.24810240268707276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,16,balanced,0.29942933718363446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,16,power_law_1.01,5.581612777709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,16,power_law_1.2,0.25754880905151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,16,power_law_1.01,0.3339967966079712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,16,power_law_1.2,0.28353281021118165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,16,power_law_1.01,0.3827264070510864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,16,balanced,0.3495306571324666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,16,power_law_1.2,0.2948096036911011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,16,power_law_1.01,0.5345471858978271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,16,power_law_1.2,0.32003839015960694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,16,power_law_1.2,0.299238395690918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,16,power_law_1.2,0.37449600696563723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,16,balanced,1.3540053367614746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,16,power_law_1.01,0.5706240177154541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,16,power_law_1.2,0.3783616065979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,16,balanced,0.43169601758321124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,16,power_law_1.2,0.4839615821838379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,16,power_law_1.01,0.7969791889190674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,16,balanced,3.7335198720296225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,16,power_law_1.2,0.5012735843658447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,16,power_law_1.01,1.0850367546081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,16,balanced,0.5514933268229166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,16,power_law_1.2,0.5744128227233887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,16,power_law_1.01,1.5922752380371095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,16,power_law_1.2,0.7245183944702148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,16,power_law_1.01,2.0080127716064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,16,power_law_1.2,0.8905535697937011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,16,power_law_1.01,2.6599552154541017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,16,balanced,0.7693386872609457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,16,power_law_1.2,1.1630208015441894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,16,power_law_1.01,4.158943939208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,16,power_law_1.2,1.6242687225341796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,16,power_law_1.01,8.073779296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,16,power_law_1.2,2.0307584762573243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,16,balanced,2.0306827227274575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,16,power_law_1.2,2.405075263977051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,16,balanced,1.0047252972920735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,16,power_law_1.2,3.7466686248779295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,16,power_law_1.2,7.9531005859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,16,balanced,1.360640048980713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,16,balanced,1.7160107294718425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,16,power_law_1.2,0.08814719915390015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,16,power_law_1.2,0.1325824022293091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,16,power_law_1.2,0.10823040008544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,16,power_law_1.2,0.07429760098457336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,16,power_law_1.2,0.09486719965934753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,16,power_law_1.2,0.10377600193023681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,16,balanced,3.884943962097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,16,power_law_1.2,0.10895999670028686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,16,power_law_1.2,0.14203519821166993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,16,power_law_1.2,0.14597760438919066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,16,balanced,2.6673332850138345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,16,power_law_1.2,0.1365504026412964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,16,power_law_1.2,0.1522112011909485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,16,power_law_1.2,0.15002880096435547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,16,power_law_1.2,0.153164803981781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,16,power_law_1.2,0.16978559494018555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,16,power_law_1.2,0.18491519689559938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,16,power_law_1.2,0.19474560022354126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,16,power_law_1.2,0.19550080299377443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,16,power_law_1.2,0.22527999877929689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,16,power_law_1.2,0.24800639152526854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,16,power_law_1.2,0.30969600677490233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,16,power_law_1.2,0.34834558963775636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,16,power_law_1.2,0.4684864044189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,16,power_law_1.2,0.5312575817108154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,16,power_law_1.2,0.7035520076751709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,16,power_law_1.2,0.9319104194641114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,16,power_law_1.2,1.3177023887634278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,16,power_law_1.2,1.4989631652832032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,16,power_law_1.2,2.0722496032714846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,16,balanced,5.180629412333171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,16,power_law_1.2,3.0687231063842773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,16,power_law_1.2,0.09635199904441834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,16,power_law_1.2,0.13293440341949464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,16,power_law_1.2,6.9265602111816404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,16,power_law_1.2,0.0955839991569519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,8,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,16,power_law_1.2,0.07452160120010376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,8,balanced,0.06621866424878438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,8,balanced,0.06670933465162913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,16,power_law_1.2,0.09217919707298279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,8,balanced,0.08680533369382222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,16,power_law_1.2,0.10380799770355224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,8,balanced,0.1270026663939158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,16,power_law_1.2,0.11819519996643066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,8,balanced,0.20663466056187949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,16,power_law_1.2,0.13898880481719972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,8,balanced,0.2905600070953369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,8,balanced,0.2944213350613912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,8,balanced,0.04869333406289419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,16,power_law_1.2,0.14867839813232422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,8,balanced,0.293013334274292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,8,balanced,0.05387733379999796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,16,power_law_1.2,0.14394240379333495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,8,balanced,0.2943039933840434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,8,balanced,0.05384533107280731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,16,power_law_1.2,0.15687040090560914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,8,balanced,0.2946186661720276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,8,balanced,0.0699946681658427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,16,power_law_1.2,0.15701760053634645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,8,balanced,0.3006986578305562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,8,balanced,0.09212266405423482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,8,balanced,0.3004693388938904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,16,power_law_1.2,0.16901760101318358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,8,balanced,0.13480533162752786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,8,balanced,0.30401066939036053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,16,power_law_1.2,0.18009599447250366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,8,balanced,0.17710399627685547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,8,balanced,0.3125493327776591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,16,power_law_1.2,0.18750079870223998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,8,balanced,0.17709332704544067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,8,balanced,0.31465067466100055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,8,balanced,0.17818133036295572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,16,power_law_1.2,0.21663999557495117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,8,balanced,0.17880533138910928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,8,balanced,0.3224800030390422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,16,power_law_1.2,0.22420480251312255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,8,balanced,0.18183465798695883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,8,balanced,0.33473066488901776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,16,power_law_1.2,0.29815680980682374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,8,balanced,0.18427733580271402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,8,balanced,0.3466399908065796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,8,balanced,0.0516480008761088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,8,balanced,0.18619734048843384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,8,power_law_1.01,0.08665599822998046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,8,balanced,0.1889280080795288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,8,balanced,0.055215999484062195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,8,balanced,0.3736000061035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,16,power_law_1.2,0.34853758811950686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,8,balanced,0.06140799820423126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,8,balanced,0.1970026691754659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,8,power_law_1.01,0.12108160257339477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,8,balanced,0.07580799857775371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,8,balanced,0.4060906569163005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,8,balanced,0.20098666350046793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,8,power_law_1.01,0.2008960008621216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,8,balanced,0.09386666615804036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,16,power_law_1.2,0.3296832084655762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,8,balanced,0.1390666663646698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,8,power_law_1.01,0.08469759821891784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,8,balanced,0.2097866733868917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,16,power_law_1.2,0.42186880111694336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,8,balanced,0.18549867471059164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,8,balanced,0.4471199909845988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,8,power_law_1.01,0.11706880331039429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,8,balanced,0.22502400477727255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,8,balanced,0.1857866644859314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,16,power_law_1.2,0.6351871967315674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,8,power_law_1.01,0.14846080541610718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,8,balanced,0.18699200948079428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,8,balanced,0.2416800061861674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,8,balanced,0.5017120043436686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,8,balanced,0.18836800257364908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,8,power_law_1.01,0.17089920043945311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,16,power_law_1.2,0.6641536235809327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,8,balanced,0.27426666021347046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,8,balanced,0.19033066431681314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,8,power_law_1.01,0.21143679618835448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,16,power_law_1.2,0.9545536041259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,8,balanced,0.193231999874115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,8,balanced,0.3153120080629985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,8,power_law_1.01,0.23284480571746827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,8,balanced,0.5897813240687052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,8,balanced,0.19671465953191122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,16,power_law_1.2,1.3034624099731444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,8,power_law_1.01,0.22979199886322021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,8,balanced,0.19875200589497885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,8,balanced,0.3773866494496663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,16,power_law_1.2,1.8494335174560548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,8,power_law_1.01,0.237062406539917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,8,balanced,0.20950400829315186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,16,power_law_1.2,2.457164764404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,8,power_law_1.01,0.24186239242553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,8,balanced,0.21389333407084146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,8,balanced,0.43329068024953205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,8,balanced,0.7445013523101807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,8,power_law_1.01,0.24179201126098632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,16,power_law_1.2,3.077471923828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,8,balanced,0.22506133715311685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,8,power_law_1.01,0.2553920030593872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,8,balanced,0.24715199073155722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,16,power_law_1.2,5.537190246582031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,8,power_law_1.01,0.27696640491485597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,8,balanced,0.5446240107218424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,8,power_law_1.01,0.28549120426177976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,16,power_law_1.2,9.147718048095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,8,power_law_1.01,0.29656319618225097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,8,balanced,0.9281973044077555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,8,power_law_1.01,0.0657472014427185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,8,balanced,0.2683253288269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,8,power_law_1.01,0.3407104015350342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,8,balanced,0.7053120136260986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,8,power_law_1.01,0.08351359963417053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,8,power_law_1.01,0.3556864023208618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,8,power_law_1.01,0.12346240282058715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,8,power_law_1.01,0.4072000026702881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,8,power_law_1.01,0.06947839856147767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,8,power_law_1.01,0.45664000511169434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,8,power_law_1.01,0.08358399868011475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,8,power_law_1.01,0.547270393371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,8,power_law_1.01,0.11367679834365844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,8,balanced,0.3265226682027181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,8,balanced,1.2550026575724285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,8,balanced,0.9389493465423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,8,power_law_1.01,0.6178688049316406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,8,power_law_1.01,0.11872639656066894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,8,balanced,0.37988801797231037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,8,power_law_1.01,0.792742395401001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,8,power_law_1.01,0.13363200426101685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,8,power_law_1.01,0.9621120452880859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,8,balanced,0.46553067366282147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,8,power_law_1.01,0.14851200580596924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,8,power_law_1.01,1.3171520233154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,8,power_law_1.01,0.1488703966140747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,8,power_law_1.01,1.7295040130615233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,8,power_law_1.01,0.15642240047454833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,8,balanced,0.5826026598612467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,8,power_law_1.01,1.9419008255004884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,8,balanced,1.249338706334432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,8,power_law_1.01,0.1545408010482788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,8,power_law_1.01,3.075641632080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,8,power_law_1.01,0.16750080585479737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,8,balanced,1.5377012888590496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,8,balanced,0.7474986712137858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,8,power_law_1.01,0.16790399551391602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,8,power_law_1.01,6.5019775390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,8,power_law_1.01,0.18499840497970582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,8,power_law_1.01,0.19629440307617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,8,power_law_1.01,0.19883519411087036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,8,balanced,1.0332159996032715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,8,power_law_1.01,0.2302272081375122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,8,balanced,1.5469652811686199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,8,power_law_1.01,0.24956159591674804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,8,power_law_1.01,0.30195839405059816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,8,power_law_1.01,0.3310080051422119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,8,balanced,1.378010590871175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,8,power_law_1.01,0.46416640281677246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,8,power_law_1.01,0.5132991790771484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,8,balanced,2.3309760093688965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,8,power_law_1.01,0.6680960178375244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,8,power_law_1.01,0.8352191925048829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,8,power_law_1.2,0.0870527982711792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,8,power_law_1.01,1.1514880180358886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,8,power_law_1.2,0.12061439752578736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,8,power_law_1.01,0.07764480113983155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,8,power_law_1.01,1.4693504333496095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,8,balanced,1.8749705950419109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,8,power_law_1.2,0.10864640474319458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,8,power_law_1.01,0.097952002286911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,8,power_law_1.2,0.08448640108108521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,8,power_law_1.01,1.8791423797607423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,8,power_law_1.01,0.14703999757766723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,8,balanced,2.36297607421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,8,power_law_1.01,0.07407360076904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,8,power_law_1.2,0.12000000476837158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,8,power_law_1.01,0.09649919867515563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,8,power_law_1.01,2.932383918762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,8,power_law_1.2,0.13646080493927001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,8,power_law_1.01,0.11514879465103149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,8,power_law_1.2,0.16235519647598268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,8,power_law_1.01,0.13200639486312865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,8,power_law_1.01,5.456665420532227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,8,power_law_1.01,0.14337919950485228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,8,power_law_1.2,0.20563840866088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,8,power_law_1.01,0.14401919841766359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,8,power_law_1.2,0.22885758876800538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,8,power_law_1.01,0.15701760053634645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,8,power_law_1.2,0.2209023952484131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,8,power_law_1.01,0.16246399879455567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,8,balanced,2.354933261871338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,8,power_law_1.01,0.17503999471664428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,8,power_law_1.2,0.22552320957183838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,8,power_law_1.01,0.1790719985961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,8,power_law_1.2,0.23710720539093016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,8,power_law_1.01,0.18544000387191772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,8,power_law_1.01,0.20215680599212646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,8,power_law_1.2,0.2528000116348267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,8,power_law_1.01,0.21658239364624024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,8,power_law_1.2,0.2598207950592041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,8,power_law_1.01,0.2537087917327881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,8,power_law_1.01,0.28047358989715576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,8,power_law_1.2,0.2728319883346558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,8,power_law_1.2,0.28650879859924316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,8,power_law_1.01,0.3204224109649658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,8,power_law_1.2,0.2962944030761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,8,power_law_1.2,0.33276801109313964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,8,power_law_1.2,0.3631743907928467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,8,power_law_1.01,0.36311678886413573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,8,power_law_1.2,0.44588799476623536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,8,power_law_1.01,0.46019840240478516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,8,balanced,4.353946685791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,8,power_law_1.2,0.5050303936004639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,8,power_law_1.01,0.5901247978210449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,8,balanced,3.685248057047526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,8,power_law_1.2,0.6060544013977051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,8,power_law_1.01,0.7289919853210449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,8,power_law_1.2,0.6987135887145997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,8,power_law_1.01,1.0197183609008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,8,power_law_1.01,1.2491071701049805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,8,power_law_1.2,0.8695743560791016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,8,power_law_1.01,1.8479488372802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,8,power_law_1.2,1.102899169921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,8,balanced,4.507760047912598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,8,power_law_1.01,2.4339519500732423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,8,power_law_1.2,1.5091775894165038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,8,power_law_1.01,3.055776023864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,8,power_law_1.2,1.8312576293945313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,8,power_law_1.01,4.558636856079102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,8,power_law_1.2,2.0856000900268556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,8,power_law_1.01,9.545696258544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,8,power_law_1.2,3.311532974243164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,8,power_law_1.2,7.873273468017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,8,power_law_1.2,0.06602240204811097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,8,power_law_1.2,0.08344320058822632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,8,power_law_1.2,0.07990400195121765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,8,power_law_1.2,0.07022079825401306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,8,power_law_1.2,0.0846015989780426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,8,power_law_1.2,0.10587519407272339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,8,power_law_1.2,0.11163519620895386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,8,balanced,7.2030824025472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,8,power_law_1.2,0.1356287956237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,8,power_law_1.2,0.13602559566497802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,8,power_law_1.2,0.14371199607849122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,8,power_law_1.2,0.14202879667282103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,8,power_law_1.2,0.15448960065841674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,8,power_law_1.2,0.16547839641571044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,8,power_law_1.2,0.1738816022872925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,8,power_law_1.2,0.1866752028465271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,8,power_law_1.2,0.1991871953010559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,8,power_law_1.2,0.20441598892211915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,8,power_law_1.2,0.23128960132598878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,8,power_law_1.2,0.2536895990371704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,8,power_law_1.2,0.311244797706604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,8,power_law_1.2,0.3606208086013794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,8,power_law_1.2,0.07796480059623719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,8,power_law_1.2,0.47735037803649905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,8,power_law_1.2,0.09781759977340698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,8,power_law_1.2,0.5456960201263428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,8,power_law_1.2,0.07729920148849487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,8,power_law_1.2,0.0775168001651764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,8,power_law_1.2,0.7473343849182129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,8,power_law_1.2,0.09411200284957885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,8,power_law_1.2,0.906060791015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,8,power_law_1.2,0.10193920135498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,8,power_law_1.2,1.2253312110900878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,8,power_law_1.2,0.12451839447021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,8,power_law_1.2,1.643846321105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,8,power_law_1.2,0.1418176054954529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,8,power_law_1.2,2.0212223052978517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,8,power_law_1.2,0.14495999813079835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,8,power_law_1.2,0.1549888014793396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,8,power_law_1.2,3.259475326538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,8,power_law_1.2,0.1586303949356079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,8,power_law_1.2,6.571724700927734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,8,power_law_1.2,0.17619199752807618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,8,power_law_1.2,0.18554240465164185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,8,power_law_1.2,0.18510719537734985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,4,balanced,0.05682133138179779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,8,power_law_1.2,0.211244797706604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,4,balanced,0.05905599892139435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,4,balanced,0.06746133168538411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,8,power_law_1.2,0.22439041137695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,4,balanced,0.09078400333722432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,8,power_law_1.2,0.25306239128112795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,4,balanced,0.1357919971148173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,8,power_law_1.2,0.3060352087020874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,4,balanced,0.21469332774480185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,4,balanced,0.30029867092768353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,4,balanced,0.30189865827560425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,8,power_law_1.2,0.3435967922210693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,4,balanced,0.3007520039876302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,4,balanced,0.30482665697733563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,4,balanced,0.3071039915084839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,8,power_law_1.2,0.40215039253234863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,4,balanced,0.31229867537816364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,8,power_law_1.2,0.4769728183746338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,4,balanced,0.31330132484436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,4,balanced,0.31986133257548016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,8,power_law_1.2,0.686406421661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,4,balanced,0.3275199929873149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,8,power_law_1.2,0.8388799667358399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,4,balanced,0.04982399940490723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,4,balanced,0.3325600028038025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,8,power_law_1.2,1.123200035095215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,4,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,4,balanced,0.34116268157958984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,8,power_law_1.2,1.3345536231994628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,4,balanced,0.05637866755326589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,4,balanced,0.3667626778284709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,4,balanced,0.07286933561166127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,8,power_law_1.2,2.094380760192871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,4,balanced,0.09928533434867859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,4,balanced,0.37941332658131915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,4,balanced,0.14735999703407288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,8,power_law_1.2,2.807935905456543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,4,balanced,0.4106026490529378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,4,balanced,0.19538132349650064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,8,power_law_1.2,3.420742416381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,4,balanced,0.19901333252588907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,4,power_law_1.01,0.06476160287857055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,4,balanced,0.4537920157114665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,4,balanced,0.19896533091862997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,8,power_law_1.2,5.028492736816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,4,power_law_1.01,0.0828224003314972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,4,balanced,0.20272000630696616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,4,balanced,0.5251413186391195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,4,balanced,0.20432533820470175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,4,power_law_1.01,0.12205439805984497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,4,balanced,0.20915200312932333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,4,balanced,0.06659733255704244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,8,power_law_1.2,12.632780456542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,4,power_law_1.01,0.07983999848365783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,4,balanced,0.21246933937072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,4,balanced,0.07094933092594147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,4,power_law_1.01,0.11864960193634033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,4,balanced,0.6078293323516846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,4,balanced,0.07766399780909221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,4,balanced,0.21756800015767416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,4,power_law_1.01,0.15264639854431153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,4,power_law_1.01,0.0545087993144989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,4,balanced,0.09118933478991191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,4,balanced,0.2278560002644857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,4,balanced,0.11644267042477925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,4,power_law_1.01,0.16792960166931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,4,balanced,0.1680319905281067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,4,power_law_1.01,0.06627200245857238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,4,balanced,0.23249600330988565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,4,balanced,0.21672000487645468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,4,balanced,0.7378880182902018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,4,power_law_1.01,0.20828800201416015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,4,power_law_1.01,0.0907584011554718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,4,balanced,0.21841599543889365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,4,balanced,0.24229333798090616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,4,balanced,0.22174400091171265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,4,power_law_1.01,0.22240641117095947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,4,power_law_1.01,0.0706496000289917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,4,balanced,0.22483199834823608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,4,balanced,0.2632213234901428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,4,power_law_1.01,0.23766400814056396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,4,balanced,0.22775999704996744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,4,power_law_1.01,0.08803840279579163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,4,balanced,0.23280533154805502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,4,balanced,0.28335465987523395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,4,power_law_1.01,0.24715518951416016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,4,balanced,0.9345333576202393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,4,power_law_1.01,0.11287039518356323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,4,balanced,0.23568000396092734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,4,balanced,0.24589866399765015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,4,power_law_1.01,0.2580032110214233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,4,balanced,0.3227253357569377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,4,power_law_1.01,0.12137600183486938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,4,balanced,0.2580746610959371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,4,power_law_1.01,0.26477439403533937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,4,balanced,0.26290667057037354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,4,power_law_1.01,0.13827840089797974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,4,balanced,0.3726239999135335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,4,balanced,0.2786613305409749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,4,power_law_1.01,0.2813375949859619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,4,power_law_1.01,0.153766405582428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,4,balanced,0.3099520007769267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,4,power_law_1.01,0.2915839910507202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,4,power_law_1.01,0.15745279788970948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,4,balanced,0.4414079984029134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,4,balanced,1.2247467041015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,4,power_law_1.01,0.3006720066070557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,4,power_law_1.01,0.16768640279769897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,4,power_law_1.01,0.3157439947128296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,4,power_law_1.01,0.17424639463424682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,4,balanced,0.5270506540934244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,4,balanced,0.37055468559265137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,4,power_law_1.01,0.36710400581359864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,4,power_law_1.01,0.18116480112075806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,4,power_law_1.01,0.38946559429168703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,4,power_law_1.01,0.19493759870529176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,4,power_law_1.01,0.07809280157089234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,4,power_law_1.01,0.47316479682922363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,4,power_law_1.01,0.2114880084991455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,4,balanced,0.68886931737264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,4,power_law_1.01,0.09031040072441102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,4,power_law_1.01,0.5151040077209472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,4,power_law_1.01,0.22459518909454346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,4,balanced,1.6413226127624512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,4,power_law_1.01,0.11663360595703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,4,power_law_1.01,0.2214207887649536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,4,power_law_1.01,0.6255807876586914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,4,balanced,0.48469332853953045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,4,power_law_1.01,0.0913856029510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,4,power_law_1.01,0.26302080154418944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,4,power_law_1.01,0.6893695831298828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,4,power_law_1.01,0.10061440467834473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,4,balanced,0.5616533358891805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,4,balanced,0.8929653167724609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,4,power_law_1.01,0.29555840492248536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,4,power_law_1.01,0.13351039886474608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,4,power_law_1.01,0.8903167724609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,4,power_law_1.01,0.37087359428405764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,4,power_law_1.01,0.1479871988296509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,4,balanced,0.6800159613291422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,4,power_law_1.01,1.2132479667663574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,4,power_law_1.01,0.40351362228393556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,4,power_law_1.01,0.169542396068573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,4,power_law_1.01,1.6021120071411132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,4,balanced,0.8933119773864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,4,power_law_1.01,0.17460479736328124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,4,power_law_1.01,0.49857277870178224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,4,power_law_1.01,1.845267105102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,4,power_law_1.01,0.18625919818878173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,4,power_law_1.01,0.5972032070159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,4,balanced,1.229535977045695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,4,balanced,1.9978186289469402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,4,power_law_1.01,2.176812744140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,4,power_law_1.01,0.1913472056388855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,4,power_law_1.01,0.7681920051574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,4,balanced,1.1597599983215332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,4,power_law_1.01,0.20622079372406005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,4,power_law_1.01,0.9749183654785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,4,power_law_1.01,3.6453121185302733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,4,power_law_1.01,0.21254398822784423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,4,power_law_1.01,1.4156800270080567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,4,power_law_1.01,0.23864960670471191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,4,power_law_1.01,6.532991790771485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,4,power_law_1.01,1.8041536331176757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,4,balanced,1.6483893394470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,4,power_law_1.01,0.2531519889831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,4,power_law_1.01,2.135468864440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,4,power_law_1.01,0.2702719926834106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,4,balanced,1.627120018005371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,4,power_law_1.01,3.4525310516357424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,4,power_law_1.01,0.30665600299835205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,4,power_law_1.01,0.37909119129180907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,4,power_law_1.01,6.728550720214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,4,balanced,2.224575996398926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,4,power_law_1.01,0.45777277946472167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,4,balanced,3.014122645060221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,4,power_law_1.01,0.5557504177093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,4,power_law_1.2,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,4,balanced,2.00874662399292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,4,power_law_1.01,0.6250688076019287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,4,power_law_1.2,0.08262400031089782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,4,balanced,2.983274777730306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,4,power_law_1.01,0.8288064002990723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,4,power_law_1.2,0.07262719869613647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,4,power_law_1.01,1.0467647552490233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,4,power_law_1.2,0.07896320223808288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,4,power_law_1.01,1.4157888412475585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,4,power_law_1.2,0.1085312008857727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,4,power_law_1.01,1.7995136260986329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,4,power_law_1.2,0.1368191957473755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,4,power_law_1.2,0.152729594707489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,4,power_law_1.01,2.564703941345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,4,power_law_1.2,0.20398080348968506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,4,power_law_1.01,3.45813102722168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,4,power_law_1.2,0.21475839614868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,4,balanced,3.7112693786621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,4,power_law_1.2,0.22503039836883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,4,power_law_1.01,4.343167877197265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,4,power_law_1.2,0.23602559566497802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,4,power_law_1.2,0.2560703992843628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,4,power_law_1.01,6.783993530273437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,4,power_law_1.2,0.2632256031036377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,4,balanced,3.067632039388021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,4,power_law_1.2,0.2776063919067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,4,power_law_1.01,13.702963256835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,4,power_law_1.2,0.2970815896987915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,4,power_law_1.2,0.310700798034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,4,power_law_1.2,0.3238719940185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,4,power_law_1.2,0.3652672052383423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,4,power_law_1.2,0.4151103973388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,4,power_law_1.2,0.4936192035675049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,4,balanced,5.8064320882161455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,4,balanced,5.616832097371419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,4,power_law_1.2,0.5264256000518799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,4,power_law_1.2,0.6661695957183837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,4,power_law_1.2,0.7192895889282227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,4,power_law_1.2,0.9250816345214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,4,power_law_1.2,0.054636800289154054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,4,power_law_1.2,1.2995455741882325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,4,power_law_1.2,0.06648319959640503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,4,power_law_1.2,1.7858495712280273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,4,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,4,power_law_1.2,2.131820869445801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,4,power_law_1.2,0.06865919828414917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,4,power_law_1.2,0.08673920035362244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,4,power_law_1.2,2.4664831161499023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,4,power_law_1.2,0.10192639827728271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,4,power_law_1.2,4.102975845336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,4,power_law_1.2,0.11889280080795288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,4,power_law_1.2,0.13690240383148194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,4,power_law_1.2,7.349465942382812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,4,power_law_1.2,0.14862719774246216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,4,balanced,5.831872304280599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,4,power_law_1.2,0.1550336003303528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,4,power_law_1.2,0.170579195022583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,4,power_law_1.2,0.17415679693222047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,4,power_law_1.2,0.1781823992729187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,4,power_law_1.2,0.18787839412689208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,4,power_law_1.2,0.21194241046905518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,4,power_law_1.2,0.21843841075897216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,4,balanced,11.40057627360026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,4,power_law_1.2,0.22872960567474365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,4,power_law_1.2,0.26508800983428954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,4,power_law_1.2,0.31064960956573484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,4,power_law_1.2,0.37650558948516843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,4,power_law_1.2,0.41891841888427733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,4,power_law_1.2,0.5219840049743653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,4,power_law_1.2,0.6366464138031006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,4,power_law_1.2,0.7978240013122558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,4,power_law_1.2,1.0148672103881835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,4,power_law_1.2,1.498316764831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,4,power_law_1.2,1.941766357421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,4,power_law_1.2,2.2587072372436525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,4,power_law_1.2,3.925606536865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,4,power_law_1.2,6.819468688964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,4,power_law_1.2,0.07798399925231933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,4,power_law_1.2,0.09059839844703674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,2,balanced,0.0595360000928243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,4,power_law_1.2,0.08794239759445191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,2,balanced,0.06403199831644694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,4,power_law_1.2,0.089273601770401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,2,balanced,0.07268266876538594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,4,power_law_1.2,0.10503679513931274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,2,balanced,0.09828799962997437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,2,balanced,0.1498293379942576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,4,power_law_1.2,0.12707200050354003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,2,balanced,0.24413333336512247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,2,balanced,0.34377598762512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,4,power_law_1.2,0.14186240434646608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,2,balanced,0.34419198830922443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,4,power_law_1.2,0.1671872019767761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,2,balanced,0.3487199942270915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,2,balanced,0.351151982943217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,4,power_law_1.2,0.17115520238876342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,2,balanced,0.3439146677652995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,4,power_law_1.2,0.17933440208435059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,2,balanced,0.34986666838328045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,2,balanced,0.35317333539326984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,4,power_law_1.2,0.18069759607315064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,2,balanced,0.3535786469777425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,4,power_law_1.2,0.2020479917526245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,2,balanced,0.36345068613688153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,4,power_law_1.2,0.2132863998413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,2,balanced,0.36849065621693927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,4,power_law_1.2,0.22755200862884523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,2,balanced,0.38733331362406415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,4,power_law_1.2,0.2557440042495728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,2,balanced,0.4174933433532715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,4,power_law_1.2,0.2781440019607544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,2,balanced,0.4402773380279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,4,power_law_1.2,0.3111936092376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,2,balanced,0.50054931640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,4,power_law_1.2,0.4018303871154785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,2,balanced,0.5846293369928995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,4,power_law_1.2,0.4784063816070557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,2,balanced,0.052671998739242554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,2,balanced,0.6752959887186686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,2,balanced,0.05574933191140493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,2,balanced,0.06128533184528351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,4,power_law_1.2,0.540550422668457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,2,balanced,0.0823520024617513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,2,balanced,0.8064533074696859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,2,balanced,0.1165706713994344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,4,power_law_1.2,0.6679488182067871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,2,balanced,0.1812959909439087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,4,power_law_1.2,0.8324095726013183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,2,balanced,0.24497065941492716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,2,balanced,1.0397173563639324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,2,balanced,0.24616533517837524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,4,power_law_1.2,1.0754816055297851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,2,balanced,0.2489759922027588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,4,power_law_1.2,1.6116479873657226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,2,balanced,0.25175466140111286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,2,balanced,0.25574400027592975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,4,power_law_1.2,1.9548736572265626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,2,balanced,0.2600906689961751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,2,balanced,1.3517653147379558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,2,balanced,0.26316799720128375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,4,power_law_1.2,2.811686325073242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,2,balanced,0.26898133754730225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,4,power_law_1.2,3.7470977783203123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,2,balanced,0.28123732407887775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,2,balanced,0.09654399752616882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,2,balanced,0.2885013421376546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,4,power_law_1.2,4.645836639404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,2,balanced,0.10268266995747884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,2,balanced,0.30638400713602704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,2,balanced,1.8703786532084148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,2,balanced,0.111135999361674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,4,power_law_1.2,7.436275482177734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,2,balanced,0.12966400384902954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,2,balanced,0.33259199062983197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,2,balanced,0.16131200393040976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,2,balanced,0.3673066695531209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,2,balanced,0.22639999787012735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,2,balanced,0.2890346646308899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,4,power_law_1.2,14.704261779785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,2,balanced,0.42923200130462646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,2,balanced,0.2943519949913025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,2,balanced,0.3017759919166565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,2,balanced,0.49907199541727704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,2,balanced,0.3055199980735779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,2,balanced,2.3700265884399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,2,balanced,0.3173706730206807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,2,balanced,0.5909546613693237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,2,balanced,0.32144532601038617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,2,power_law_1.01,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,2,power_law_1.01,0.059359997510910034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,2,balanced,0.3287946581840515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,2,power_law_1.01,0.05904639959335327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,2,balanced,0.34141866366068524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,2,power_law_1.01,0.0689087986946106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,2,balanced,0.7237386703491211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,2,power_law_1.01,0.07534080147743225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,2,balanced,0.3643519878387451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,2,power_law_1.01,0.09052159786224365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,2,power_law_1.01,0.07289599776268005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,2,balanced,0.37302935123443604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,2,power_law_1.01,0.08490239977836608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,2,balanced,0.9900000095367432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,2,power_law_1.01,0.10087679624557495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,2,balanced,0.4145706494649251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,2,power_law_1.01,0.12208000421524048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,2,balanced,2.980640093485514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,2,power_law_1.01,0.12932480573654176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,2,power_law_1.01,0.16297600269317628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,2,balanced,0.48075199127197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,2,power_law_1.01,0.14258559942245483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,2,power_law_1.01,0.17626880407333373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,2,power_law_1.01,0.09548799991607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,2,power_law_1.01,0.17380479574203492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,2,power_law_1.01,0.24082560539245607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,2,balanced,1.3040053049723308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,2,power_law_1.01,0.18742400407791138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,2,power_law_1.01,0.10354559421539307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,2,power_law_1.01,0.24528000354766846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,2,power_law_1.01,0.12183040380477905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,2,balanced,0.5795733531316122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,2,power_law_1.01,0.18945280313491822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,2,power_law_1.01,0.2566015958786011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,2,power_law_1.01,0.12168960571289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,2,power_law_1.01,0.19952640533447266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,2,power_law_1.01,0.27859840393066404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,2,power_law_1.01,0.14039679765701293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,2,power_law_1.01,0.17264000177383423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,2,power_law_1.01,0.21484160423278809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,2,power_law_1.01,0.28536961078643797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,2,power_law_1.01,0.19566719532012938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,2,balanced,1.844048023223877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,2,power_law_1.01,0.21941120624542237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,2,power_law_1.01,0.29555840492248536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,2,power_law_1.01,0.2239743947982788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,2,power_law_1.01,0.23551359176635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,2,power_law_1.01,0.23991041183471679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,2,power_law_1.01,0.3173759937286377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,2,balanced,0.7678186893463135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,2,power_law_1.01,0.24593279361724854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,2,power_law_1.01,0.25914878845214845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,2,power_law_1.01,0.33397760391235354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,2,power_law_1.01,0.26352639198303224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,2,power_law_1.01,0.27236480712890626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,2,balanced,0.9062346617380778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,2,power_law_1.01,0.35199360847473143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,2,power_law_1.01,0.27479679584503175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,2,power_law_1.01,0.2913856029510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,2,power_law_1.01,0.28136959075927737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,2,balanced,4.5368852615356445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,2,power_law_1.01,0.35112318992614744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,2,power_law_1.01,0.31300480365753175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,2,balanced,1.1116053263346355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,2,power_law_1.01,0.32836480140686036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,2,power_law_1.01,0.4152575969696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,2,power_law_1.01,0.3425663948059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,2,balanced,2.3340746561686196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,2,power_law_1.01,0.3784447908401489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,2,power_law_1.01,0.4601920127868652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,2,power_law_1.01,0.37102720737457273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,2,power_law_1.01,0.4648320198059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,2,power_law_1.01,0.550105619430542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,2,balanced,1.4973759651184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,2,power_law_1.01,0.43389439582824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,2,power_law_1.01,0.5520703792572021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,2,power_law_1.01,0.5175104141235352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,2,power_law_1.01,0.5906239986419678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,2,power_law_1.01,0.6382719993591308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,2,power_law_1.01,0.7183743953704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,2,balanced,1.9699947039286296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,2,power_law_1.01,0.6448383808135987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,2,power_law_1.01,0.8725184440612793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,2,power_law_1.01,0.7786431789398194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,2,power_law_1.2,0.05939840078353882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,2,power_law_1.01,1.122054386138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,2,power_law_1.01,1.0463744163513184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,2,power_law_1.2,0.07071999907493591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,2,power_law_1.01,0.7637055873870849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,2,power_law_1.01,1.3430975914001464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,2,power_law_1.01,1.4301247596740723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,2,power_law_1.2,0.07255679965019227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,2,balanced,2.9293225606282554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,2,power_law_1.01,0.9340864181518554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,2,balanced,2.7770347595214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,2,power_law_1.01,1.910163116455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,2,power_law_1.01,1.983942413330078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,2,power_law_1.2,0.08243200182914734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,2,power_law_1.01,1.2889408111572265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,2,power_law_1.01,1.5714943885803223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,2,power_law_1.01,2.4911935806274412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,2,power_law_1.2,0.11409280300140381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,2,power_law_1.01,2.569375991821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,2,power_law_1.01,2.293049621582031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,2,power_law_1.2,0.14391679763793946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,2,power_law_1.01,3.050592041015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,2,power_law_1.01,3.1414976119995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,2,power_law_1.01,2.965216064453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,2,power_law_1.2,0.16015360355377198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,2,power_law_1.01,4.144172668457031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,2,power_law_1.01,4.736979293823242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,2,power_law_1.01,4.953964614868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,2,power_law_1.2,0.22304000854492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,2,balanced,3.7873814900716147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,2,power_law_1.01,5.386547088623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,2,power_law_1.2,0.23323519229888917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,2,power_law_1.01,9.482169342041015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,2,power_law_1.2,0.2507904052734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,2,power_law_1.01,9.87078399658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,2,power_law_1.01,6.827487945556641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,2,power_law_1.2,0.2634687900543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,2,power_law_1.01,10.356288146972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,2,power_law_1.2,0.2854975938796997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,2,power_law_1.2,0.2929408073425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,2,power_law_1.01,21.706758117675783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,2,balanced,4.484437306722005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,2,power_law_1.2,0.3248831987380981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,2,balanced,5.154831886291504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,2,power_law_1.2,0.33720319271087645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,2,balanced,8.452608108520508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,2,power_law_1.2,0.3579391956329346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,2,power_law_1.2,0.3620160102844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,2,power_law_1.2,0.42084479331970215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,2,power_law_1.2,0.46666879653930665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,2,power_law_1.2,0.584876823425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,2,power_law_1.2,0.615283203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,2,power_law_1.2,0.7823552131652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,2,balanced,6.424736022949219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,2,power_law_1.2,0.9356224060058593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,2,power_law_1.2,1.2194239616394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,2,power_law_1.2,1.514361572265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,2,power_law_1.2,2.0767168045043944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,2,power_law_1.2,2.695052719116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,2,power_law_1.2,3.2637630462646485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,2,power_law_1.2,5.460563278198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,2,power_law_1.2,10.193785858154296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,2,balanced,10.069295883178711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,2,balanced,8.61346689860026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,2,power_law_1.2,0.05319039821624756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,2,power_law_1.2,0.058182400465011594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,2,power_law_1.2,0.06212480068206787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,2,power_law_1.2,0.07315840125083924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,2,power_law_1.2,0.09500160217285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,2,power_law_1.2,0.12350080013275147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,2,power_law_1.2,0.1343168020248413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,2,power_law_1.2,0.16542719602584838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,2,power_law_1.2,0.17875200510025024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,2,power_law_1.2,0.18248319625854492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,2,power_law_1.2,0.1969599962234497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,2,power_law_1.2,0.21557118892669677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,2,power_law_1.2,0.22112638950347902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,2,power_law_1.2,0.23445119857788085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,2,power_law_1.2,0.2620543956756592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,2,power_law_1.2,0.27684481143951417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,2,power_law_1.2,0.284172797203064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,2,power_law_1.2,0.34284799098968505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,2,balanced,19.70505650838216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,2,power_law_1.2,0.38847999572753905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,2,power_law_1.2,0.48631038665771487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,2,power_law_1.2,0.5330239772796631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,2,power_law_1.2,0.676800012588501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,2,power_law_1.2,0.8133695602416993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,2,power_law_1.2,1.07194242477417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,2,power_law_1.2,1.4018688201904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,2,power_law_1.2,1.9593856811523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,2,power_law_1.2,2.611756706237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,2,power_law_1.2,3.236102294921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,2,power_law_1.2,4.764108657836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,2,power_law_1.2,10.21313247680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,1,balanced,0.06730666756629944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,1,balanced,0.07980266710122426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,1,balanced,0.09244267145792644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,1,balanced,0.12717333436012268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,1,balanced,0.18525334199269614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,2,power_law_1.2,0.09548159837722778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,1,balanced,0.29185599088668823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,1,balanced,0.41015998522440594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,2,power_law_1.2,0.10389120578765869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,1,balanced,0.418287992477417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,1,balanced,0.42244799931844074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,2,power_law_1.2,0.11356159448623657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,1,balanced,0.424293319384257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,2,power_law_1.2,0.122707200050354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,1,balanced,0.42244799931844074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,1,balanced,0.4307946761449178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,2,power_law_1.2,0.13602559566497802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,1,balanced,0.061530664563179016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,1,balanced,0.4367893139521281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,2,power_law_1.2,0.1613312005996704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,1,balanced,0.4445813496907552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,1,balanced,0.06854933500289917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,1,balanced,0.454800009727478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,2,power_law_1.2,0.18773119449615477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,1,balanced,0.07918933530648549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,1,balanced,0.4610399802525838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,2,power_law_1.2,0.2203007936477661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,1,balanced,0.11171733339627583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,1,balanced,0.4783253272374471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,1,balanced,0.16141866644223532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,2,power_law_1.2,0.23040640354156494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,1,balanced,0.5329813162485758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,1,balanced,0.26412800947825116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,1,balanced,0.5802773237228394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,2,power_law_1.2,0.23672959804534913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,1,balanced,0.3646453221638997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,1,balanced,0.36735467116038006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,1,balanced,0.6739892959594727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,2,power_law_1.2,0.25397119522094724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,1,balanced,0.3691466649373372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,1,balanced,0.8368639945983887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,2,power_law_1.2,0.2743680000305176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,1,balanced,0.37196799119313556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,1,balanced,0.37644799550374347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,2,power_law_1.2,0.2908927917480469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,1,balanced,0.9814933141072592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,1,balanced,0.3814506530761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,2,power_law_1.2,0.3166975975036621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,1,balanced,0.3869333267211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,2,power_law_1.2,0.33914239406585694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,1,balanced,0.39971200625101727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,1,balanced,1.2367573579152424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,2,power_law_1.2,0.37500801086425783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,1,balanced,0.40600534280141193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,1,balanced,0.42178134123484295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,2,power_law_1.2,0.4285696029663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,1,balanced,1.664954662322998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,1,balanced,0.4452586571375529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,2,power_law_1.2,0.5545087814331054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,1,balanced,0.4846666653951009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,1,balanced,0.5579573313395182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,2,power_law_1.2,0.652569580078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,1,balanced,2.218437353769938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,1,power_law_1.01,0.055251199007034305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,1,power_law_1.01,0.06159359812736511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,1,balanced,0.6462080081303915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,1,power_law_1.01,0.064300799369812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,1,power_law_1.01,0.07538560032844543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,1,balanced,0.7695840199788412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,2,power_law_1.2,0.7953023910522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,1,power_law_1.01,0.0745855987071991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,1,power_law_1.01,0.08799359798431397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,2,power_law_1.2,0.9517631530761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,1,power_law_1.01,0.09386879801750184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,1,power_law_1.01,0.10594559907913208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,1,balanced,0.9239733219146729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,2,power_law_1.2,1.3435071945190429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,1,power_law_1.01,0.1306048035621643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,1,balanced,3.083594640096029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,1,power_law_1.01,0.15180799961090088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,2,power_law_1.2,1.6588735580444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,1,power_law_1.01,0.17287039756774902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,1,power_law_1.01,0.19133440256118775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,1,balanced,1.153007984161377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,1,power_law_1.01,0.2026815891265869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,2,power_law_1.2,2.3725248336791993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,1,power_law_1.01,0.22043519020080565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,1,power_law_1.01,0.2475519895553589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,1,power_law_1.01,0.2822016000747681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,2,power_law_1.2,3.0079296112060545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,1,power_law_1.01,0.26039040088653564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,1,balanced,1.6054080327351887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,1,power_law_1.01,0.29872000217437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,2,power_law_1.2,4.240832138061523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,1,power_law_1.01,0.26800639629364015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,1,power_law_1.01,0.31393280029296877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,1,balanced,3.898341178894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,1,power_law_1.01,0.2857919931411743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,2,power_law_1.2,5.5444286346435545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,1,power_law_1.01,0.33267199993133545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,1,power_law_1.01,0.30279040336608887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,1,power_law_1.01,0.3470911979675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,1,balanced,2.151498635609945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,2,power_law_1.2,7.289190673828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,1,power_law_1.01,0.32705280780792234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,1,power_law_1.01,0.3624703884124756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,1,power_law_1.01,0.3512703895568848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,1,power_law_1.01,0.3857599973678589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,2,power_law_1.2,10.892486572265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,1,power_law_1.01,0.37574400901794436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,1,power_law_1.01,0.4063744068145752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,1,power_law_1.01,0.3989311933517456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,1,power_law_1.01,0.42287359237670896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,2,power_law_1.2,20.564044189453124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,1,power_law_1.01,0.4207808017730713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,1,balanced,3.0726613998413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,1,power_law_1.01,0.4654975891113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,1,power_law_1.01,0.5039872169494629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,1,power_law_1.01,0.5473023891448975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,1,balanced,4.872122764587402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,1,power_law_1.01,0.5847231864929199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,1,power_law_1.01,3.239904022216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,1,power_law_1.01,0.7285568237304687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,1,power_law_1.01,3.388127899169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,1,power_law_1.01,0.7750144004821777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,1,power_law_1.01,0.868012809753418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,1,power_law_1.01,0.9822976112365722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,1,power_law_1.01,1.064134407043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,1,balanced,3.8515307108561196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,1,power_law_1.01,1.1913408279418944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,1,power_law_1.01,1.2817472457885741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,1,power_law_1.01,1.6218944549560548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,1,power_law_1.01,1.728166389465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,1,power_law_1.01,2.080761528015137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,1,power_law_1.01,2.129267120361328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,1,power_law_1.01,2.9775615692138673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,1,power_law_1.01,3.0337215423583985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,1,power_law_1.01,3.9040576934814455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,1,power_law_1.01,3.866284942626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,1,balanced,7.449258804321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,1,power_law_1.01,4.773612976074219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,1,power_law_1.01,4.715232086181641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,1,balanced,4.851408004760742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,1,power_law_1.01,7.287007904052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,1,power_law_1.01,7.531270599365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,1,power_law_1.01,15.555416870117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,1,power_law_1.01,15.497062683105469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,1,power_law_1.2,0.061478400230407716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,1,power_law_1.2,0.06896640062332153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,1,power_law_1.2,0.07611520290374756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,1,power_law_1.2,0.10806399583816528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,1,power_law_1.2,0.14469759464263915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,1,balanced,7.476128260294597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,1,power_law_1.2,0.17909120321273803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,1,power_law_1.2,0.20139520168304442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,1,power_law_1.2,0.2871551990509033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,1,power_law_1.2,0.29950718879699706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,1,power_law_1.2,0.30205440521240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,1,power_law_1.2,0.3079360008239746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,1,power_law_1.2,0.3277375936508179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,1,power_law_1.2,0.3618367910385132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,1,power_law_1.2,0.3873408079147339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,1,power_law_1.2,0.4074560165405273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,1,balanced,14.188821156819662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,1,power_law_1.2,0.4189760208129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,1,power_law_1.2,0.477510404586792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,1,power_law_1.2,0.5654592037200927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,1,power_law_1.2,3.495404815673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,1,power_law_1.2,3.66497917175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,1,power_law_1.2,0.9171135902404786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,1,power_law_1.2,1.1213567733764649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,1,power_law_1.2,1.3552512168884276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,1,power_law_1.2,1.7902143478393555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,1,power_law_1.2,2.182003211975098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,1,power_law_1.2,3.11147518157959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,1,balanced,14.527205149332682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,1,power_law_1.2,3.8697662353515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,1,power_law_1.2,0.055340802669525145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,1,power_law_1.2,4.701926422119141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,1,power_law_1.2,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,1,power_law_1.2,0.07220479846000671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,1,power_law_1.2,7.566041564941406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,1,power_law_1.2,0.09143679738044738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,1,power_law_1.2,0.12328319549560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,1,power_law_1.2,15.708589172363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,1,power_law_1.2,0.1579967975616455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,1,power_law_1.2,0.18585599660873414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,1,power_law_1.2,0.2360703945159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,1,power_law_1.2,0.25489919185638427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,1,power_law_1.2,0.26439039707183837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,1,power_law_1.2,0.28562560081481936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,1,power_law_1.2,0.30481278896331787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,1,power_law_1.2,0.3209791898727417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,1,power_law_1.2,0.351200008392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,1,power_law_1.2,0.3806335926055908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,1,power_law_1.2,0.40120959281921387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,1,power_law_1.2,0.41822080612182616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,1,power_law_1.2,0.5159872055053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,1,power_law_1.2,0.5892672061920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,1,power_law_1.2,0.741209602355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,1,power_law_1.2,0.8110783576965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,1,power_law_1.2,1.0354047775268556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,1,power_law_1.2,1.2535552024841308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,1,power_law_1.2,1.683456039428711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,32,balanced,0.05796800057093302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,32,power_law_1.01,0.10183680057525635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,1,power_law_1.2,2.1550912857055664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,32,balanced,0.05894933144251505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,32,power_law_1.01,0.08548480272293091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,32,balanced,0.05855466425418854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,1,power_law_1.2,3.0535743713378904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,32,power_law_1.01,0.065830397605896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,32,balanced,0.05454933146635691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,1,power_law_1.2,3.9329151153564452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,32,balanced,0.06638933221499126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,32,power_law_1.01,0.057107198238372806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,32,power_law_1.2,0.10151040554046631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,32,balanced,0.07948799928029378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,32,power_law_1.01,0.06807039976119995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,1,power_law_1.2,4.7910400390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,32,balanced,0.08751466870307922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,32,power_law_1.2,0.0865664005279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,32,power_law_1.01,0.07827839851379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,32,balanced,0.08808533350626628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,32,power_law_1.2,0.0598143994808197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,32,power_law_1.01,0.08352000117301941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,1,power_law_1.2,7.339750671386719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,32,balanced,0.12396267056465149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,32,power_law_1.2,0.0585536003112793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,32,power_law_1.01,0.07927039861679078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,32,balanced,0.12353066603342693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,32,power_law_1.2,0.06776959896087646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,32,balanced,0.12146666646003723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,32,power_law_1.01,0.12057600021362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,1,power_law_1.2,15.913958740234374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,32,power_law_1.2,0.07641599774360656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,32,balanced,0.11918399731318156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,32,power_law_1.01,0.11934080123901367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,32,balanced,0.11777599652608235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,32,power_law_1.2,0.0821120023727417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,32,power_law_1.01,0.11006079912185669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,32,balanced,0.11658133069674174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,32,power_law_1.2,0.08465920090675354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,32,power_law_1.01,0.11829119920730591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,32,balanced,0.11549333731333415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,32,power_law_1.2,0.12092159986495972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,32,power_law_1.01,0.11977599859237671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,32,balanced,0.11653866370519002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,32,power_law_1.2,0.12023040056228637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,32,power_law_1.01,0.11759999990463257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,32,balanced,0.11762133240699768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,32,power_law_1.2,0.12456320524215699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,32,power_law_1.01,0.11827839612960815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,32,power_law_1.2,0.11242239475250244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,32,balanced,0.12086400389671326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,32,power_law_1.01,0.1160256028175354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,32,power_law_1.2,0.1186303973197937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,32,balanced,0.12354133526484172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,32,power_law_1.01,0.12054400444030762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,32,power_law_1.2,0.111571204662323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,32,balanced,0.1307253340880076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,16,balanced,0.04692799846331278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,32,power_law_1.2,0.11780480146408082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,32,power_law_1.01,0.12327040433883667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,16,balanced,0.04929066697756449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,32,balanced,0.13726933797200522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,32,power_law_1.2,0.12329599857330323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,32,power_law_1.01,0.14787839651107787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,16,balanced,0.049072002371152244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,32,balanced,0.15340266625086466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,32,power_law_1.2,0.121452796459198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,32,power_law_1.01,0.19791359901428224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,16,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,32,power_law_1.2,0.14725120067596437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,32,power_law_1.01,0.21040000915527343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,16,balanced,0.04353600243727366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,32,balanced,0.1721280018488566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,32,power_law_1.2,0.18839679956436156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,16,balanced,0.058490668733914696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,32,power_law_1.01,0.2853568077087402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,32,power_law_1.2,0.2116544008255005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,16,balanced,0.06253333389759064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,32,power_law_1.01,0.40675840377807615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,32,balanced,0.280021329720815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,16,balanced,0.06400000055631001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,32,power_law_1.2,0.25303680896759034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,32,power_law_1.01,0.4726463794708252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,16,balanced,0.07186133166154225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,32,power_law_1.2,0.34281599521636963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,32,power_law_1.01,0.6395584106445312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,16,balanced,0.07307733098665874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,32,balanced,0.31724266211191815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,32,power_law_1.2,0.5149759769439697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,32,power_law_1.01,1.1035648345947267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,16,balanced,0.07282666862010956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,32,power_law_1.2,0.6187647819519043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,32,power_law_1.01,1.462611198425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,16,balanced,0.121370663245519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,32,power_law_1.2,0.7996096134185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,16,balanced,0.12090667088826497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,32,power_law_1.2,1.271827220916748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,32,balanced,0.46319464842478436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,16,power_law_1.01,0.07182080149650574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,32,power_law_1.01,1.7968320846557617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,16,balanced,0.12043733398119609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,32,power_law_1.2,1.6580799102783204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,16,power_law_1.01,0.08944000005722046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,16,balanced,0.12074666221936543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,32,power_law_1.01,2.604172706604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,16,power_law_1.01,0.060864001512527466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,32,power_law_1.2,1.905196762084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,16,power_law_1.01,0.05443199872970581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,16,balanced,0.12171733379364014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,16,power_law_1.01,0.05086719989776611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,32,power_law_1.2,4.239878463745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,32,power_law_1.01,4.861548614501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,32,balanced,0.606058677037557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,16,balanced,0.1225226620833079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,16,power_law_1.01,0.05319679975509643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,16,balanced,0.12589866916338602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,16,power_law_1.01,0.06220160126686096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,32,power_law_1.2,8.262067413330078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,16,power_law_1.01,0.06058239936828613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,16,balanced,0.12846933801968893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,16,power_law_1.01,0.07148159742355346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,16,power_law_1.01,0.07314559817314148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,16,balanced,0.1360640029112498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,16,power_law_1.01,0.07317119836807251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,16,power_law_1.2,0.07070720195770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,32,balanced,0.7496480147043864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,16,power_law_1.01,0.12200319766998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,16,balanced,0.14235732952753702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,16,power_law_1.2,0.08220800161361694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,16,power_law_1.01,0.12167680263519287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,16,power_law_1.01,0.12244479656219483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,16,balanced,0.15826132893562317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,16,power_law_1.2,0.054118400812149046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,16,power_law_1.01,0.12149759531021118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,16,power_law_1.01,0.12354559898376465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,16,power_law_1.2,0.05124480128288269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,16,balanced,0.17228267590204874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,16,power_law_1.01,0.12646399736404418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,16,power_law_1.2,0.05319679975509643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,16,power_law_1.01,0.13155200481414794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,16,power_law_1.01,0.14106240272521972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,16,power_law_1.2,0.05432320237159729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,16,balanced,0.2746293346087138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,16,power_law_1.01,0.16873600482940673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,32,balanced,1.1815679868062336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,16,power_law_1.2,0.061587202548980716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,16,power_law_1.01,0.18624000549316405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,16,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,16,power_law_1.01,0.2525504112243652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,16,balanced,0.31349867582321167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,16,power_law_1.01,0.3158400058746338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,16,power_law_1.2,0.07207040190696716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,16,power_law_1.01,0.3965696096420288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,16,power_law_1.2,0.07242239713668823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,16,power_law_1.01,0.5272128105163574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,16,power_law_1.2,0.0717631995677948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,16,power_law_1.01,0.7840191841125488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,16,balanced,0.45629334449768066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,16,power_law_1.2,0.1217087984085083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,16,power_law_1.01,0.9533247947692871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,16,power_law_1.2,0.121561598777771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,16,power_law_1.01,1.179980754852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,16,power_law_1.2,0.12550400495529174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,16,power_law_1.01,1.9396032333374023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,16,power_law_1.2,0.12378239631652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,16,power_law_1.01,3.8092929840087892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,16,balanced,0.5964959859848022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,16,power_law_1.2,0.11547520160675048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,16,power_law_1.2,0.12683520317077637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,16,power_law_1.2,0.13231359720230101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,16,power_law_1.2,0.14054399728775024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,32,balanced,2.333914597829183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,16,power_law_1.2,0.1841279983520508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,16,balanced,0.7383733590443929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,16,power_law_1.2,0.21544320583343507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,16,power_law_1.2,0.26384639739990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,16,power_law_1.2,0.3650239944458008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,16,power_law_1.2,0.4799808025360107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,16,power_law_1.2,0.6640255928039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,8,balanced,0.033402666449546814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,16,balanced,1.1670133272806804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,16,power_law_1.2,0.9722559928894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,8,balanced,0.035162667433420815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,8,balanced,0.03696533292531967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,16,power_law_1.2,1.3138751983642578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,8,balanced,0.04111466556787491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,16,power_law_1.2,1.5741951942443848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,8,balanced,0.05009066561857859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,8,balanced,0.05776533484458923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,16,power_law_1.2,2.566668891906738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,8,balanced,0.058559998869895935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,8,power_law_1.01,0.0349375993013382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,16,power_law_1.2,5.592185592651367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,8,balanced,0.058335999647776283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,8,balanced,0.06016000111897787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,8,power_law_1.01,0.04200319945812225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,8,balanced,0.06081066528956095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,8,power_law_1.01,0.03868800103664398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,8,balanced,0.0609386662642161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,8,power_law_1.01,0.04687359929084778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,8,balanced,0.07410133381684621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,8,power_law_1.01,0.04718720018863678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,8,balanced,0.07429333527882893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,8,power_law_1.01,0.05431039929389954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,8,balanced,0.07397866745789845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,16,balanced,2.290719985961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,8,power_law_1.01,0.05559039711952209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,8,balanced,0.11506666739781697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,8,power_law_1.01,0.056569600105285646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,8,balanced,0.11521066228548686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,8,power_law_1.01,0.05916799902915955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,8,balanced,0.11691199739774068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,8,power_law_1.01,0.059443199634552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,8,balanced,0.12030933300654094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,8,power_law_1.01,0.06039680242538452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,8,balanced,0.12349866827329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,8,power_law_1.01,0.0722815990447998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,8,balanced,0.1328053375085195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,8,power_law_1.01,0.07155200242996215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,8,balanced,0.1404853363831838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,8,power_law_1.01,0.07290239930152893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,8,balanced,0.15968533356984457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,8,power_law_1.01,0.11892479658126831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,8,balanced,0.17638933658599854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,8,power_law_1.01,0.11772160530090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,8,power_law_1.01,0.11989120244979859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,8,balanced,0.27455466985702515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,8,power_law_1.01,0.12388479709625244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,8,power_law_1.01,0.1373952031135559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,8,power_law_1.01,0.1513216018676758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,8,balanced,0.31202133496602374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,8,power_law_1.01,0.18354560136795045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,8,power_law_1.01,0.2255295991897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,8,power_law_1.01,0.27289600372314454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,8,balanced,0.45235733191172284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,8,power_law_1.01,0.35793280601501465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,4,balanced,0.02917333443959554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,8,power_law_1.01,0.4830848217010498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,8,power_law_1.2,0.03531520068645477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,4,balanced,0.03252800057331721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,8,power_law_1.01,0.6581503868103027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,8,balanced,0.5906240145365397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,8,power_law_1.2,0.04229120016098022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,4,balanced,0.03270933280388514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,8,power_law_1.01,0.8660608291625976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,4,balanced,0.0393653338154157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,8,power_law_1.2,0.03779839873313904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,8,power_law_1.01,0.9873023986816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,4,balanced,0.0446720023949941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,8,power_law_1.2,0.04556800127029419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,4,balanced,0.05898133416970571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,8,power_law_1.01,1.6132991790771485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,8,power_law_1.2,0.0469760000705719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,4,balanced,0.058101331194241844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,8,balanced,0.7304800351460775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,8,power_law_1.2,0.053324800729751584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,8,power_law_1.01,3.1202239990234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,4,balanced,0.05807999769846598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,8,power_law_1.2,0.056627202033996585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,4,balanced,0.058330665032068886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,8,power_law_1.2,0.05603839755058289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,4,balanced,0.05855466425418854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,4,balanced,0.05933333436648051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,8,power_law_1.2,0.05952640175819397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,4,balanced,0.0634986658891042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,8,power_law_1.2,0.05896959900856018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,4,balanced,0.06356266637643178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,4,power_law_1.01,0.030399999022483824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,8,power_law_1.2,0.05950719714164734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,4,balanced,0.06425066788991292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,8,balanced,1.1487733523050945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,8,power_law_1.2,0.07187839746475219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,4,power_law_1.01,0.03416320085525513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,4,balanced,0.07539733250935872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,8,power_law_1.2,0.07354879975318909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,4,power_law_1.01,0.03518719971179962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,4,balanced,0.07667199770609538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,8,power_law_1.2,0.07423999905586243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,4,power_law_1.01,0.04092159867286682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,4,balanced,0.0779306689898173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,8,power_law_1.2,0.1165120005607605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,4,power_law_1.01,0.046854400634765626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,4,balanced,0.12966400384902954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,8,power_law_1.2,0.12157440185546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,4,power_law_1.01,0.05134080052375793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,4,balanced,0.13359999656677246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,8,power_law_1.2,0.12910720109939575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,4,power_law_1.01,0.054099202156066895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,4,balanced,0.1421280006567637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,8,power_law_1.2,0.13386240005493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,4,power_law_1.01,0.05464320182800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,4,power_law_1.2,0.030374398827552794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,4,balanced,0.15075733264287314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,4,power_law_1.01,0.055366402864456175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,8,power_law_1.2,0.14401919841766359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,4,power_law_1.2,0.0341376006603241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,4,power_law_1.01,0.05614719986915588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,8,power_law_1.2,0.16136319637298585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,4,power_law_1.2,0.0323199987411499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,4,balanced,0.170799990495046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,4,power_law_1.2,0.041875201463699344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,4,power_law_1.01,0.056006401777267456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,8,power_law_1.2,0.1950271964073181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,4,power_law_1.2,0.04668160080909729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,4,balanced,0.1874613364537557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,4,power_law_1.01,0.061337602138519284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,8,power_law_1.2,0.2577663898468018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,4,power_law_1.2,0.04835839867591858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,4,power_law_1.2,0.0542464017868042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,4,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,8,power_law_1.2,0.29780480861663816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,8,balanced,2.2584959665934243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,4,power_law_1.2,0.05494400262832642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,4,balanced,0.2887893319129944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,4,power_law_1.01,0.06282240152359009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,8,power_law_1.2,0.395961594581604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,4,power_law_1.2,0.053651201725006106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,4,power_law_1.2,0.055743998289108275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,4,power_law_1.01,0.07496320009231568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,8,power_law_1.2,0.4973504066467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,4,power_law_1.2,0.05637120008468628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,4,power_law_1.01,0.07633280158042907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,4,balanced,0.3266400098800659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,8,power_law_1.2,0.707583999633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,4,power_law_1.2,0.062028801441192626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,4,power_law_1.2,0.06257280111312866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,4,power_law_1.01,0.0785152018070221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,8,power_law_1.2,1.0185728073120117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,4,power_law_1.2,0.0642687976360321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,4,power_law_1.01,0.12968319654464722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,4,power_law_1.2,0.07592960000038147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,8,power_law_1.2,1.1899840354919433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,4,power_law_1.01,0.13855359554290772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,4,power_law_1.2,0.07825919985771179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,4,balanced,0.47886399428049725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,2,balanced,0.02779199928045273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,8,power_law_1.2,1.997612762451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,4,power_law_1.2,0.08255360126495362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,4,power_law_1.01,0.15289599895477296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,4,power_law_1.2,0.14019839763641356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,2,balanced,0.03145066648721695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,8,power_law_1.2,3.9639488220214845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,4,power_law_1.01,0.17215360403060914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,4,power_law_1.2,0.14507520198822021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,2,balanced,0.032111999889214836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,4,power_law_1.2,0.16821119785308838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,4,power_law_1.01,0.21916160583496094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,2,balanced,0.04022400081157684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,4,power_law_1.2,0.1926591992378235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,4,balanced,0.6191519896189371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,4,power_law_1.01,0.24956159591674804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,4,power_law_1.2,0.23824639320373536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,2,balanced,0.05133866767088572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,4,power_law_1.01,0.3560960054397583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,4,power_law_1.2,0.2779839992523193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,2,power_law_1.01,0.02821120023727417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,4,power_law_1.2,0.3867199897766113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,4,power_law_1.01,0.45669121742248536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,2,balanced,0.06886933247248332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,4,power_law_1.2,0.43928961753845214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,2,power_law_1.01,0.031327998638153075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,4,power_law_1.01,0.5987391948699952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,2,balanced,0.06738666693369548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,4,balanced,0.765338659286499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,2,power_law_1.01,0.03260799944400787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,4,power_law_1.2,0.6241792201995849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,4,power_law_1.01,0.7884160041809082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,2,balanced,0.06739200154940288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,4,power_law_1.2,0.8862208366394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,2,power_law_1.01,0.04140160083770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,4,power_law_1.01,0.8893247604370117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,2,balanced,0.06359466910362244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,4,power_law_1.2,1.0439167976379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,2,power_law_1.01,0.04648320078849792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,2,balanced,0.06402666866779327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,4,power_law_1.01,1.4592831611633301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,4,power_law_1.2,1.6403839111328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,2,balanced,0.06428800026575725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,2,power_law_1.01,0.04906879961490631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,4,power_law_1.01,2.7794496536254885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,4,power_law_1.2,3.4590080261230467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,2,balanced,0.0718453327814738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,2,power_law_1.01,0.06039680242538452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,2,balanced,0.07269333302974701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,2,power_law_1.01,0.06117759943008423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,4,balanced,1.1986400286356609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,2,balanced,0.07257066667079926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,2,power_law_1.01,0.05910400152206421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,2,balanced,0.08166933556397755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,2,power_law_1.01,0.06005120277404785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,2,balanced,0.08237333099047343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,2,power_law_1.01,0.061919999122619626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,2,balanced,0.0848640004793803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,2,power_law_1.01,0.07048320174217224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,2,balanced,0.09437333544095357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,2,power_law_1.01,0.07125120162963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,2,balanced,0.0990773340066274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,2,power_law_1.01,0.07364479899406433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,2,balanced,0.1730133295059204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,2,power_law_1.01,0.08058879971504211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,2,balanced,0.18228266636530557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,2,power_law_1.01,0.08268160223960877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,2,power_law_1.01,0.08552320003509521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,2,balanced,0.20515199502309164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,2,power_law_1.01,0.10865919589996338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,2,balanced,0.22572267055511475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,4,balanced,2.354095935821533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,2,power_law_1.01,0.11847679615020752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,2,power_law_1.01,0.20436480045318603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,2,balanced,0.3771626551946004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,2,power_law_1.01,0.22260479927062987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,2,power_law_1.01,0.2657599925994873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,2,balanced,0.4182933171590169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,2,power_law_1.01,0.3252671957015991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,2,power_law_1.2,0.027968001365661622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,2,power_law_1.01,0.41969919204711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,2,power_law_1.2,0.031065601110458373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,2,power_law_1.01,0.5204671859741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,2,balanced,0.6079946756362915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,2,power_law_1.2,0.030604800581932066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,2,power_law_1.01,0.706873607635498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,2,power_law_1.2,0.040703999996185306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,2,power_law_1.01,0.9601216316223145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,2,power_law_1.2,0.04420480132102966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,2,balanced,0.7949066956837972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,2,power_law_1.2,0.049747198820114136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,2,power_law_1.01,1.1471487998962402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,2,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,2,power_law_1.01,1.7726079940795898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,2,power_law_1.2,0.06182399988174438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,2,power_law_1.01,3.5837310791015624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,2,power_law_1.2,0.059359997510910034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,2,power_law_1.2,0.05912320017814636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,2,balanced,0.9860693613688151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,2,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,2,power_law_1.2,0.07012479901313781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,2,power_law_1.2,0.07214080095291138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,2,power_law_1.2,0.07383679747581481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,2,power_law_1.2,0.08135679960250855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,2,power_law_1.2,0.0843392014503479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,2,balanced,1.5428320566813152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,2,power_law_1.2,0.08839679956436157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,2,power_law_1.2,0.11390719413757325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,1,balanced,0.024869332710901897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,2,power_law_1.2,0.12175359725952148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,2,power_law_1.2,0.20924160480499268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,1,balanced,0.026543999711672466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,1,balanced,0.028730665644009907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,2,power_law_1.2,0.22985599040985108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,1,balanced,0.035536001125971474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,2,power_law_1.2,0.3051071882247925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,1,balanced,0.04859200119972229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,2,power_law_1.2,0.33527679443359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,1,balanced,0.07039999961853027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,2,power_law_1.2,0.4255680084228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,1,power_law_1.01,0.02393600046634674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,1,balanced,0.07135466734568278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,2,power_law_1.2,0.5397183895111084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,1,power_law_1.01,0.025830399990081788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,2,power_law_1.2,0.7714111804962158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,1,power_law_1.01,0.026092800498008727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,1,balanced,0.06925866504510243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,2,power_law_1.2,1.0339391708374024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,1,power_law_1.01,0.03407360017299652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,2,balanced,3.0334294637044272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,2,power_law_1.2,1.194822406768799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,1,power_law_1.01,0.04087679982185364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,1,balanced,0.06977599859237671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,2,power_law_1.2,1.7430591583251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,1,power_law_1.01,0.04716159999370575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,1,balanced,0.06764266888300578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,1,power_law_1.01,0.05750399827957153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,1,balanced,0.06773333251476288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,2,power_law_1.2,3.753945541381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,1,balanced,0.06507733464241028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,1,power_law_1.01,0.05795199871063232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,1,balanced,0.06492800017197926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,1,power_law_1.01,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,1,balanced,0.06669866542021434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,1,power_law_1.01,0.06245120167732239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,1,balanced,0.07495466868082683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,1,power_law_1.01,0.06356480121612548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,1,balanced,0.07715199887752533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,1,power_law_1.01,0.06213759779930115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,1,balanced,0.08011733492215474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,1,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,1,power_law_1.01,0.06273279786109924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,1,balanced,0.09347732861836751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,1,power_law_1.01,0.07422720193862915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,1,power_law_1.2,0.025484800338745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,1,balanced,0.0993173321088155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,1,power_law_1.01,0.07722880244255066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,1,power_law_1.2,0.026547199487686156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,1,power_law_1.01,0.08143360018730164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,1,power_law_1.2,0.03330560028553009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,1,balanced,0.12196266651153564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,1,power_law_1.01,0.09516159892082214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,1,power_law_1.2,0.04010240137577057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,1,balanced,0.13395733634630838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,1,power_law_1.01,0.10202879905700683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,1,power_law_1.2,0.044352000951766966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,1,balanced,0.23919999599456787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,1,power_law_1.01,0.11836800575256348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,1,power_law_1.2,0.0555840015411377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,1,power_law_1.2,0.05715199708938599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,1,power_law_1.01,0.15615999698638916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,1,balanced,0.26375999053319293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,1,power_law_1.2,0.06063359975814819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,1,power_law_1.01,0.17909760475158693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,1,balanced,0.4455840190251668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,32,balanced,0.050666665037473045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,1,power_law_1.2,0.06206079721450806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,1,power_law_1.01,0.3002432107925415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,32,power_law_1.01,0.049747198820114136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,1,power_law_1.2,0.0636352002620697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,1,power_law_1.01,0.3674943923950195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,1,balanced,0.4946560064951579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,1,power_law_1.2,0.06155520081520081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,1,power_law_1.01,0.48273282051086425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,32,balanced,0.05225066840648651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,32,power_law_1.01,0.050387197732925416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,1,power_law_1.2,0.06704639792442321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,1,power_law_1.01,0.5907455921173096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,1,power_law_1.2,0.07481600046157837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,1,power_law_1.01,0.8079936027526855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,32,balanced,0.05193066596984863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,1,balanced,0.7186133066813151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,32,power_law_1.01,0.050470399856567386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,1,power_law_1.2,0.07767680287361145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,1,power_law_1.01,1.0290752410888673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,1,power_law_1.2,0.08214399814605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,1,power_law_1.01,1.2518464088439942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,1,power_law_1.2,0.09609599709510804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,32,balanced,0.05872533222039541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,1,power_law_1.2,0.10368640422821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,1,power_law_1.01,1.905695915222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,32,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,1,balanced,0.9417546590169271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,1,power_law_1.2,0.12360320091247559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,1,power_law_1.01,3.676403045654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,1,power_law_1.2,0.16166399717330932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,1,power_law_1.2,0.18259840011596679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,32,balanced,0.06253333389759064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,1,power_law_1.2,0.32359039783477783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,32,power_law_1.01,0.05795199871063232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,1,balanced,1.1651679674784343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,1,power_law_1.2,0.3730815887451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,1,power_law_1.2,0.49237761497497556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,1,power_law_1.2,0.6018943786621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,1,power_law_1.2,0.8228992462158203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,32,balanced,0.06990399956703186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,1,power_law_1.2,1.0439552307128905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,32,power_law_1.01,0.06793599724769592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,1,power_law_1.2,1.2649663925170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,32,power_law_1.2,0.05015040040016174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,1,balanced,1.8281866709391277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,1,power_law_1.2,1.9176511764526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,32,power_law_1.2,0.0506816029548645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,1,power_law_1.2,3.6885761260986327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,32,power_law_1.2,0.050271999835968015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,32,power_law_1.2,0.054739201068878175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,32,power_law_1.2,0.05799679756164551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,32,balanced,0.07086400190989177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,32,power_law_1.01,0.06958720088005066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,32,power_law_1.2,0.06762239933013917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,32,balanced,0.07030400137106578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,32,power_law_1.01,0.07000960111618042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,32,power_law_1.2,0.07015039920806884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,32,power_law_1.2,0.0704576015472412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,32,balanced,0.08332266906897227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,32,power_law_1.2,0.0831167995929718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,32,balanced,0.08348799745241801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,32,power_law_1.01,0.08263040184974671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,32,power_law_1.2,0.08301439881324768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,32,balanced,0.08415466547012329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,32,balanced,0.08370133241017659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,32,power_law_1.01,0.08263040184974671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,32,power_law_1.2,0.08366079926490784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,32,balanced,0.08431466420491536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,1,balanced,3.5954720179239907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,32,power_law_1.01,0.08296959996223449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,32,power_law_1.2,0.08439040184020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,32,balanced,0.08525333801905315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,32,power_law_1.01,0.08352000117301941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,32,balanced,0.08566400408744812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,32,power_law_1.2,0.0853056013584137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,32,balanced,0.08612799644470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,32,power_law_1.01,0.08448640108108521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,32,power_law_1.2,0.0869055986404419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,32,balanced,0.0881813367207845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,32,power_law_1.01,0.08600959777832032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,32,balanced,0.0911253293355306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,32,power_law_1.2,0.09983360171318054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,32,power_law_1.01,0.0865664005279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,32,balanced,0.09405333797136943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,32,power_law_1.2,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,32,balanced,0.10172800223032634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,32,power_law_1.01,0.09978880286216736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,32,power_law_1.2,0.11306240558624267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,32,power_law_1.01,0.11096960306167603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,32,balanced,0.11179733276367188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,32,power_law_1.2,0.16561919450759888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,32,power_law_1.01,0.12851840257644653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,32,balanced,0.14784533778826395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,32,power_law_1.2,0.18288639783859253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,32,power_law_1.01,0.14388480186462402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,32,power_law_1.2,0.25077118873596194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,32,balanced,0.16664000352223715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,32,power_law_1.01,0.22305281162261964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,16,balanced,0.04379733403523763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,32,power_law_1.2,0.29180159568786623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,16,power_law_1.01,0.05074560046195984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,32,power_law_1.01,0.27151999473571775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,32,balanced,0.2584106723467509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,32,power_law_1.2,0.4647552013397217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,32,power_law_1.01,0.39794559478759767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,32,power_law_1.2,0.5780863761901855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,16,balanced,0.04576533536116282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,32,power_law_1.01,0.5435647964477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,16,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,32,balanced,0.3098986744880676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,32,power_law_1.2,0.8318719863891602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,32,power_law_1.01,0.7566400051116944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,16,balanced,0.04586666822433472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,32,power_law_1.01,0.9438464164733886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,16,power_law_1.01,0.04810880124568939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,32,power_law_1.2,1.1143168449401855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,16,balanced,0.04814399778842926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,16,power_law_1.01,0.046086400747299194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,32,power_law_1.2,1.6914112091064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,32,power_law_1.01,1.6274944305419923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,32,balanced,0.4529973268508911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,32,power_law_1.01,2.1084224700927736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,32,power_law_1.2,2.2535423278808593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,16,balanced,0.05078400174776713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,16,power_law_1.01,0.0515392005443573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,32,power_law_1.01,2.7020992279052733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,32,power_law_1.2,2.811756706237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,32,power_law_1.2,4.4765888214111325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,32,balanced,0.5949546496073405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,32,power_law_1.01,4.168403244018554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,16,balanced,0.05492799977461497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,16,power_law_1.01,0.05537279844284058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,32,power_law_1.2,8.910073852539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,32,power_law_1.01,8.759410858154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,32,balanced,0.7369386355082194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,16,balanced,0.06030400097370148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,16,power_law_1.01,0.0640447974205017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,16,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,16,power_law_1.01,0.06238080263137817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,16,balanced,0.06727999945481618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,16,power_law_1.01,0.06647040247917176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,16,balanced,0.06729599833488464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,16,power_law_1.01,0.06643840074539184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,16,power_law_1.01,0.0667967975139618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,16,balanced,0.06779199838638306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,16,power_law_1.01,0.06705920100212097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,16,balanced,0.06761600077152252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,32,balanced,1.1665173371632893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,16,power_law_1.01,0.06726400256156921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,16,balanced,0.06835733354091644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,16,power_law_1.01,0.06826239824295044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,16,balanced,0.06884266436100006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,16,power_law_1.01,0.06903679966926575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,16,balanced,0.0691786656777064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,16,power_law_1.2,0.050809597969055174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,16,power_law_1.01,0.07014399766921997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,16,balanced,0.0697920024394989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,16,power_law_1.2,0.047814399003982544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,16,power_law_1.01,0.07297279834747314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,16,balanced,0.07144000132878621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,16,power_law_1.2,0.04952960014343262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,16,power_law_1.01,0.12108800411224366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,16,power_law_1.2,0.05101439952850342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,16,balanced,0.07468266785144806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,16,power_law_1.2,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,16,power_law_1.01,0.12438399791717529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,16,balanced,0.080335999528567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,16,power_law_1.2,0.05619199872016907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,16,power_law_1.01,0.17057280540466307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,16,balanced,0.087909330924352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,16,power_law_1.2,0.060915201902389526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,16,power_law_1.01,0.21220479011535645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,16,power_law_1.2,0.06083199977874756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,16,balanced,0.09474666913350423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,16,power_law_1.01,0.30848639011383056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,16,power_law_1.2,0.07006080150604248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,32,balanced,2.3058719635009766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,16,balanced,0.15315733353296915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,16,power_law_1.01,0.36764800548553467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,16,power_law_1.2,0.06660479903221131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,16,power_law_1.01,0.5471360206604003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,16,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,16,balanced,0.16684800386428833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,16,power_law_1.01,0.6970367908477784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,16,power_law_1.2,0.06960639953613282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,16,power_law_1.2,0.06832000017166137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,16,power_law_1.01,1.1762880325317382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,16,balanced,0.2412373423576355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,8,balanced,0.03249066571394602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,16,power_law_1.2,0.06849279999732971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,8,balanced,0.03327466547489166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,16,power_law_1.01,1.3883968353271485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,16,power_law_1.2,0.07054719924926758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,8,balanced,0.03433600068092346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,16,balanced,0.3046773274739583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,16,power_law_1.01,1.9068864822387694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,16,power_law_1.2,0.07909759879112244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,8,balanced,0.04015466570854187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,16,power_law_1.2,0.09162880182266235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,16,power_law_1.01,2.6964351654052736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,16,power_law_1.2,0.12250239849090576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,8,balanced,0.04154133299986521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,16,power_law_1.2,0.13642239570617676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,16,power_law_1.01,6.091654586791992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,16,balanced,0.44644800821940106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,16,power_law_1.2,0.1967039942741394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,8,balanced,0.044362664222717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,16,power_law_1.2,0.2687936067581177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,16,power_law_1.2,0.37932798862457273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,16,power_law_1.2,0.4681536197662354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,8,balanced,0.04619733492533366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,16,balanced,0.586357315381368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,16,power_law_1.2,0.735206413269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,16,power_law_1.2,0.9461631774902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,8,balanced,0.04875733455022176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,16,power_law_1.2,1.5857407569885253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,8,power_law_1.01,0.03333759903907776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,16,power_law_1.2,1.6418752670288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,16,balanced,0.7267253398895264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,8,power_law_1.01,0.033766400814056394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,8,balanced,0.05867200096448263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,16,power_law_1.2,2.417190361022949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,8,power_law_1.01,0.03415040075778961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,8,balanced,0.058464000622431435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,8,power_law_1.01,0.03797119855880737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,16,power_law_1.2,3.7304000854492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,8,power_law_1.01,0.04126720130443573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,16,power_law_1.2,8.414335632324219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,8,power_law_1.01,0.04449920058250427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,8,balanced,0.05459733307361603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,8,power_law_1.01,0.04643200039863586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,8,balanced,0.0533493310213089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,8,power_law_1.01,0.049619200825691226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,8,balanced,0.05913066864013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,16,balanced,1.142346700032552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,8,power_law_1.01,0.0591808021068573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,8,balanced,0.05910933514436086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,8,balanced,0.05996266504128774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,8,power_law_1.01,0.059622400999069215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,8,balanced,0.06057066718737284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,8,power_law_1.01,0.056678402423858645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,8,balanced,0.062496001521746315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,8,balanced,0.06494399905204773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,8,power_law_1.01,0.055878400802612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,8,balanced,0.0703413337469101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,8,power_law_1.01,0.058796799182891844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,8,balanced,0.09057066837946574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,8,power_law_1.01,0.06334720253944397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,8,balanced,0.09815999865531921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,8,power_law_1.01,0.06395519971847534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,8,power_law_1.01,0.07152640223503112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,8,balanced,0.1474240024884542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,8,power_law_1.01,0.07384960055351257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,8,balanced,0.169706662495931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,8,power_law_1.01,0.09316480159759521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,8,power_law_1.01,0.11174399852752685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,8,balanced,0.24445333083470663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,8,power_law_1.01,0.131494402885437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,8,power_law_1.01,0.16042879819869996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,16,balanced,2.258298714955648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,4,balanced,0.027808000644048054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,8,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,8,balanced,0.3040320078531901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,8,power_law_1.01,0.2248447895050049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,4,balanced,0.03162133445342382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,8,power_law_1.2,0.0341376006603241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,8,power_law_1.01,0.2811199903488159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,4,balanced,0.03278400003910065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,8,power_law_1.2,0.03375360071659088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,8,power_law_1.01,0.42273921966552735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,4,balanced,0.03645866612593333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,8,balanced,0.44280532995859784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,8,power_law_1.2,0.037868800759315493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,8,power_law_1.01,0.5132480144500733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,8,power_law_1.2,0.041382399201393125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,4,balanced,0.03632533301909765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,8,power_law_1.01,0.8257216453552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,8,power_law_1.2,0.04472320079803467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,4,balanced,0.03642666588226954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,8,power_law_1.01,1.1684415817260743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,8,power_law_1.2,0.046438398957252505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,8,balanced,0.5802613496780396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,8,power_law_1.2,0.049670401215553286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,8,power_law_1.01,1.4229503631591798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,4,balanced,0.03977599988381068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,8,power_law_1.2,0.05912960171699524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,8,power_law_1.01,1.887775993347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,8,power_law_1.2,0.05986559987068176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,8,power_law_1.01,3.8881473541259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,4,balanced,0.038389332592487335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,8,power_law_1.2,0.05464320182800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,8,balanced,0.7200853029886881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,8,power_law_1.2,0.05735039710998535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,8,power_law_1.2,0.06432639956474304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,4,balanced,0.04238399863243103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,8,power_law_1.2,0.06526079773902893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,8,power_law_1.2,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,4,balanced,0.04354133208592733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,8,power_law_1.2,0.07399680018424988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,8,balanced,1.1316693623860676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,4,balanced,0.042208001017570496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,8,power_law_1.2,0.07571200132369996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,4,power_law_1.01,0.02885119915008545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,8,power_law_1.2,0.10235519409179687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,4,power_law_1.01,0.031174400448799135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,8,power_law_1.2,0.1217919945716858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,4,power_law_1.01,0.03160319924354553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,8,power_law_1.2,0.13779200315475465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,4,balanced,0.05728533367315928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,8,power_law_1.2,0.19830399751663208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,4,power_law_1.01,0.034643200039863584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,8,power_law_1.2,0.23911681175231933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,4,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,4,power_law_1.01,0.03670400083065033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,8,power_law_1.2,0.3580415964126587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,4,power_law_1.01,0.039980798959732056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,8,power_law_1.2,0.5021376132965087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,4,balanced,0.06053866446018219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,4,power_law_1.01,0.04044800102710724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,8,power_law_1.2,0.7228352069854737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,4,balanced,0.05574933191140493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,4,power_law_1.01,0.04373759925365448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,8,power_law_1.2,1.1558848381042481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,4,balanced,0.056277334690093994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,4,power_law_1.01,0.04428800046443939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,8,power_law_1.2,1.5271807670593263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,4,balanced,0.06308266520500183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,4,power_law_1.01,0.043507200479507444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,8,balanced,2.233344078063965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,8,power_law_1.2,1.538111972808838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,4,balanced,0.06484800080458324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,4,power_law_1.01,0.06046079993247986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,4,balanced,0.0676693320274353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,8,power_law_1.2,3.23306884765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,4,power_law_1.01,0.06039040088653565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,4,power_law_1.01,0.05772799849510193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,4,balanced,0.07473066449165344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,8,power_law_1.2,5.984595108032226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,4,power_law_1.2,0.028908801078796387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,4,power_law_1.01,0.061408001184463504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,4,balanced,0.09206933776537578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,4,power_law_1.2,0.031711998581886294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,4,power_law_1.01,0.06586880087852479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,4,balanced,0.10131733616193135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,4,power_law_1.2,0.03128319978713989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,4,power_law_1.01,0.07134079933166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,4,power_law_1.2,0.0343423992395401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,4,balanced,0.1507200002670288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,4,power_law_1.01,0.07910400032997131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,4,power_law_1.2,0.03635840117931366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,4,power_law_1.01,0.0856000006198883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,4,balanced,0.17930134137471518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,4,power_law_1.2,0.0366784006357193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,4,power_law_1.01,0.11960320472717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,4,power_law_1.2,0.03978239893913269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,4,power_law_1.01,0.14307839870452882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,4,balanced,0.2584799925486247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,4,power_law_1.2,0.03966720104217529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,4,power_law_1.01,0.198636794090271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,4,power_law_1.2,0.04332799911499023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,4,power_law_1.01,0.25596160888671876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,4,power_law_1.2,0.04423039853572845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,4,balanced,0.3168586691220601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,4,power_law_1.2,0.04635519981384277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,4,power_law_1.01,0.34333438873291017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,4,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,4,power_law_1.01,0.4567999839782715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,2,balanced,0.02629333237806956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,4,power_law_1.2,0.06287999749183655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,4,balanced,0.4671786626180013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,4,power_law_1.01,0.6556608200073242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,2,balanced,0.029877332349618275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,4,power_law_1.2,0.060134398937225345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,4,power_law_1.01,0.878444766998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,2,balanced,0.030773334205150604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,4,power_law_1.2,0.05976319909095764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,2,balanced,0.036576000352700554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,4,power_law_1.2,0.06593279838562012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,4,power_law_1.01,1.0701248168945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,2,balanced,0.037077332536379494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,4,power_law_1.2,0.07166079878807068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,4,balanced,0.6020906766255697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,4,power_law_1.01,1.7345920562744142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,4,power_law_1.2,0.0798143982887268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,2,balanced,0.03629866739114126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,4,power_law_1.2,0.0980351984500885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,4,power_law_1.01,4.154156875610352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,4,power_law_1.2,0.12799999713897706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,2,balanced,0.03741333385308584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,4,power_law_1.2,0.1715008020401001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,2,balanced,0.03722666700681051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,4,balanced,0.7478293577829996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,4,power_law_1.2,0.21068799495697021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,4,power_law_1.2,0.2667327880859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,2,balanced,0.039749334255854286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,4,power_law_1.2,0.4271359920501709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,2,balanced,0.03862400104602178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,4,power_law_1.2,0.4827263832092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,2,balanced,0.03913066784540812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,4,power_law_1.2,0.7562240123748779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,2,power_law_1.01,0.026521599292755126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,4,power_law_1.2,1.0671744346618652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,2,power_law_1.01,0.02905600070953369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,2,balanced,0.04669333497683207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,4,balanced,1.1737653414408367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,2,power_law_1.01,0.029760000109672547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,4,power_law_1.2,1.0941632270812989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,2,balanced,0.04611733555793762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,2,power_law_1.01,0.03357439935207367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,4,power_law_1.2,2.4664703369140626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,2,balanced,0.046911999583244324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,2,power_law_1.01,0.036908799409866334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,4,power_law_1.2,4.454342269897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,2,power_law_1.01,0.03627519905567169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,2,power_law_1.01,0.038150399923324585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,2,balanced,0.06560533245404561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,2,power_law_1.01,0.04042240083217621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,2,power_law_1.01,0.043750399351119997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,2,balanced,0.06122666597366333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,2,power_law_1.01,0.04506239891052246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,2,balanced,0.06393600006898244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,2,power_law_1.01,0.04579200148582459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,2,balanced,0.07667733232180278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,2,power_law_1.01,0.0482367992401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,2,balanced,0.08228800197442372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,2,power_law_1.01,0.05069440007209778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,2,balanced,0.10693333546320598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,2,power_law_1.01,0.05325440168380737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,4,balanced,2.3111839294433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,2,balanced,0.11662933230400085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,2,power_law_1.01,0.07622399926185608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,2,power_law_1.2,0.02691200077533722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,2,balanced,0.176362673441569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,2,power_law_1.01,0.08115199804306031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,2,power_law_1.2,0.0293503999710083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,2,power_law_1.01,0.08933759927749634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,2,power_law_1.2,0.029446399211883544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,2,balanced,0.2129813234011332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,2,power_law_1.2,0.033983999490737916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,2,power_law_1.01,0.08799999952316284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,2,power_law_1.2,0.036857599020004274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,2,balanced,0.3109760085741679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,2,power_law_1.01,0.11208319664001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,2,power_law_1.2,0.03585279881954193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,2,power_law_1.01,0.14123519659042358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,2,power_law_1.2,0.03978239893913269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,2,power_law_1.01,0.15493760108947754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,2,balanced,0.40717868010203045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,2,power_law_1.01,0.20499839782714843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,2,power_law_1.2,0.0400191992521286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,2,power_law_1.2,0.04390400052070618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,2,power_law_1.01,0.29224319458007814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,1,balanced,0.02387733260790507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,2,power_law_1.01,0.41663360595703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,2,power_law_1.2,0.04466559886932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,2,balanced,0.5933440128962199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,2,power_law_1.01,0.48903679847717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,1,balanced,0.025701334079106648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,2,power_law_1.2,0.04542079865932465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,1,balanced,0.02790933350721995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,2,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,2,power_law_1.01,0.6937600135803222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,1,balanced,0.03499733408292135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,1,balanced,0.03484266748030981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,2,power_law_1.2,0.052313601970672606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,2,power_law_1.01,0.9239040374755859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,1,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,2,balanced,0.7791626453399658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,2,power_law_1.2,0.052902400493621826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,1,balanced,0.03515200068553289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,2,power_law_1.01,1.163929557800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,1,balanced,0.03369066615899404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,2,power_law_1.2,0.07465599775314331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,2,power_law_1.01,1.928825569152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,2,power_law_1.2,0.08216320276260376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,1,balanced,0.03535466641187668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,2,power_law_1.2,0.08923519849777221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,2,power_law_1.01,3.6326656341552734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,1,balanced,0.034389334420363106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,1,power_law_1.01,0.023052799701690673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,1,balanced,0.03454933315515518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,2,power_law_1.2,0.09523199796676636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,2,balanced,0.9639093081156412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,1,power_law_1.01,0.024614399671554564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,2,power_law_1.2,0.10973440408706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,1,balanced,0.038933334251244865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,1,power_law_1.01,0.026163199543952943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,2,power_law_1.2,0.1452415943145752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,1,power_law_1.01,0.02928000092506409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,2,power_law_1.2,0.16127359867095947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,1,balanced,0.03806400050719579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,1,power_law_1.01,0.03386240005493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,2,power_law_1.2,0.23406078815460205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,1,balanced,0.03962666789690653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,1,power_law_1.01,0.034483200311660765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,2,power_law_1.2,0.27540481090545654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,1,power_law_1.01,0.035283198952674864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,2,power_law_1.2,0.4143231868743896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,1,balanced,0.04631466666857401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,2,balanced,1.514992078145345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,1,power_law_1.01,0.03661440014839172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,2,power_law_1.2,0.5634367942810059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,1,power_law_1.01,0.03715839982032776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,2,power_law_1.2,0.8546239852905273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,1,power_law_1.01,0.03932799994945526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,1,balanced,0.04728533327579498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,2,power_law_1.2,0.9355199813842774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,1,power_law_1.01,0.040531200170516965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,1,balanced,0.0518453319867452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,2,power_law_1.2,1.3103167533874511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,1,power_law_1.01,0.04291839897632599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,1,power_law_1.01,0.045311999320983884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,2,power_law_1.2,2.1438272476196287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,1,power_law_1.01,0.04766719937324524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,2,power_law_1.2,3.9594047546386717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,1,power_law_1.01,0.05399680137634277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,1,balanced,0.07737599809964497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,1,power_law_1.01,0.05971199870109558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,1,balanced,0.08215466638406117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,1,balanced,0.12226667006810506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,1,power_law_1.01,0.06336640119552613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,1,power_law_1.01,0.10166399478912354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,1,balanced,0.13313066959381104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,1,power_law_1.01,0.11282559633255004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,1,power_law_1.2,0.023193599283695222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,1,balanced,0.20136533180872598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,1,power_law_1.01,0.14880640506744386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,2,balanced,2.9894933700561523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,1,power_law_1.2,0.024556800723075867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,1,balanced,0.2498133381207784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,1,power_law_1.01,0.1712767958641052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,1,power_law_1.2,0.02542079985141754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,1,power_law_1.01,0.21898241043090821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,1,balanced,0.3677866856257121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,1,power_law_1.2,0.02905600070953369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,1,power_law_1.01,0.2865920066833496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,1,power_law_1.2,0.0338239997625351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,1,power_law_1.01,0.40341758728027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,1,balanced,0.4807200034459432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,1,power_law_1.2,0.0344895988702774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,1,power_law_1.01,0.5158016204833984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,1,power_law_1.2,0.035417601466178894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,1,power_law_1.01,0.737497615814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,1,power_law_1.2,0.036908799409866334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,1,balanced,0.7052426338195801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,1,power_law_1.01,0.961023998260498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,1,power_law_1.2,0.03743360042572021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,1,power_law_1.01,1.1756799697875977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,1,power_law_1.2,0.03906559944152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,8,balanced,0.04374399781227112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,1,power_law_1.2,0.04068480134010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,1,power_law_1.01,1.8330112457275392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,1,balanced,0.9269386927286783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,8,balanced,0.042447999119758606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,1,power_law_1.2,0.04429439902305603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,8,balanced,0.040474665661652885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,1,power_law_1.01,3.6103679656982424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,1,power_law_1.2,0.04490880072116852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,8,balanced,0.04142933338880539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,1,power_law_1.2,0.04743039906024933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,8,balanced,0.0349440003434817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,8,balanced,0.042021334171295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,1,power_law_1.2,0.053420799970626834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,8,balanced,0.04256533086299896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,8,balanced,0.03764266769091288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,1,balanced,1.149450699488322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,1,power_law_1.2,0.05960959792137146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,8,balanced,0.04340800146261851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,8,balanced,0.03522133330504099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,8,balanced,0.043840001026789345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,1,power_law_1.2,0.06401919722557067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,8,balanced,0.036362667878468834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,8,balanced,0.04456533491611481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,1,power_law_1.2,0.10081919431686401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,8,balanced,0.03661333272854487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,8,balanced,0.04437866806983948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,1,power_law_1.2,0.11162240505218506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,8,balanced,0.042912001411120095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,8,balanced,0.036831999818483986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,1,power_law_1.2,0.14839040040969848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,8,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,8,balanced,0.03665599972009659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,1,power_law_1.2,0.17237119674682616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,8,balanced,0.04304533203442892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,1,balanced,1.8104747136433919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,1,power_law_1.2,0.21739521026611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,8,balanced,0.036389333506425224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,8,balanced,0.038005332152048744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,1,power_law_1.2,0.28679680824279785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,8,balanced,0.047322665651639305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,8,balanced,0.05213866631189982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,8,balanced,0.03766933331886927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,1,power_law_1.2,0.40261120796203614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,8,balanced,0.052986666560173035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,8,balanced,0.037045332292715706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,1,power_law_1.2,0.5130176067352294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,8,balanced,0.05305066704750061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,8,balanced,0.03710933278004328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,1,power_law_1.2,0.7354559898376465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,8,balanced,0.037461332976818085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,8,balanced,0.06041066845258077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,1,power_law_1.2,0.9500160217285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,8,balanced,0.038389332592487335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,8,balanced,0.05779199798901876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,1,power_law_1.2,1.1711359977722169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,8,balanced,0.04222933451334635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,8,balanced,0.07735466460386912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,1,power_law_1.2,1.8267583847045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,8,balanced,0.0759093314409256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,8,balanced,0.04309333364168803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,1,power_law_1.2,3.591737747192383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,8,balanced,0.10341333349545796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,8,balanced,0.044981335600217186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,8,balanced,0.10931733250617981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,8,balanced,0.0544106662273407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,1,balanced,3.5760908126831055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,8,balanced,0.05572799841562907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,8,balanced,0.17771732807159424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,8,balanced,0.07629866898059845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,8,balanced,0.18639999628067017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,8,balanced,0.08041066428025563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,8,balanced,0.10811733206113179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,8,balanced,0.2645333409309387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,8,balanced,0.1227946678797404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,8,balanced,0.3431626558303833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,8,balanced,0.026672000686327618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,8,balanced,0.1771893302599589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,8,balanced,0.026762666801611584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,8,balanced,0.2054133415222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,8,balanced,0.42028268178304035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,8,balanced,0.026543999711672466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,8,balanced,0.028016000986099243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,8,balanced,0.028815999627113342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,8,balanced,0.2916853427886963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,8,balanced,0.02938133229811986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,8,balanced,0.029365333418051403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,8,balanced,0.6054826577504476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,8,balanced,0.02934933453798294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,8,balanced,0.3729226589202881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,8,power_law_1.01,0.04193280041217804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,8,balanced,0.030224000414212544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,8,balanced,0.03014933317899704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,8,power_law_1.01,0.040870401263237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,8,power_law_1.01,0.04004479944705963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,8,balanced,0.4569600025812785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,8,power_law_1.01,0.042342400550842284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,8,power_law_1.01,0.042361599206924436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,8,power_law_1.01,0.04355199933052063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,8,balanced,1.174832026163737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,8,balanced,0.030368000268936157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,8,power_law_1.01,0.03443840146064758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,8,power_law_1.01,0.04635519981384277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,8,balanced,0.6966719627380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,8,balanced,0.030773334205150604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,8,power_law_1.01,0.0363072007894516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,8,power_law_1.01,0.04989440143108368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,8,power_law_1.01,0.03436799943447113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,8,balanced,0.031632001201311745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,8,power_law_1.01,0.057094401121139525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,8,power_law_1.01,0.03555200099945068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,8,balanced,0.030234667162100475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,8,power_law_1.01,0.05761280059814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,8,power_law_1.01,0.03566080033779144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,8,power_law_1.01,0.056441599130630495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,8,power_law_1.01,0.03668479919433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,8,power_law_1.01,0.06032639741897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,8,power_law_1.01,0.03715839982032776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,8,power_law_1.01,0.06773120164871216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,8,balanced,1.3302026589711506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,8,balanced,0.03825599948565165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,8,power_law_1.01,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,8,power_law_1.01,0.038099199533462524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,8,power_law_1.01,0.06938880085945129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,8,balanced,0.03830400109291077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,8,power_law_1.01,0.03886080086231232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,8,power_law_1.01,0.07877119779586791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,8,balanced,0.03853866706291834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,8,power_law_1.01,0.04658559858798981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,8,power_law_1.01,0.09049599766731262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,8,power_law_1.01,0.04447360038757324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,8,power_law_1.01,0.11503360271453858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,8,power_law_1.01,0.05061119794845581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,8,power_law_1.01,0.11485439538955688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,8,power_law_1.01,0.04961279928684235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,8,power_law_1.01,0.16109440326690674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,8,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,8,power_law_1.01,0.2006592035293579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,8,balanced,0.049072002371152244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,8,power_law_1.01,0.02619520127773285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,8,power_law_1.01,0.05935360193252563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,8,power_law_1.01,0.2721280097961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,8,balanced,0.050581331054369606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,8,power_law_1.01,0.0262719988822937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,8,power_law_1.01,0.05961599946022034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,8,power_law_1.01,0.2991487979888916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,8,power_law_1.01,0.026604801416397095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,8,power_law_1.01,0.06335359811782837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,8,power_law_1.01,0.43619837760925295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,8,power_law_1.01,0.02826879918575287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,8,power_law_1.01,0.08310400247573853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,8,power_law_1.01,0.5477248191833496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,8,power_law_1.01,0.0964352011680603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,8,power_law_1.01,0.028505599498748778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,8,power_law_1.01,0.8245759963989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,8,power_law_1.01,0.12878079414367677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,8,power_law_1.01,0.02990719974040985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,8,power_law_1.01,0.9986495971679688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,8,power_law_1.01,0.030508801341056824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,8,balanced,0.06274666885534923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,8,power_law_1.01,0.14458880424499512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,8,power_law_1.01,1.3923392295837402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,8,power_law_1.01,0.030956798791885377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,8,power_law_1.01,0.20545918941497804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,8,power_law_1.01,0.03495039939880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,8,power_law_1.01,0.252512001991272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,8,power_law_1.01,2.097248077392578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,8,power_law_1.01,0.03731839954853058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,8,power_law_1.01,0.3727871894836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,8,power_law_1.01,3.6628929138183595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,8,power_law_1.01,0.43571200370788576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,8,power_law_1.01,0.631712007522583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,8,power_law_1.01,0.039027199149131775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,8,balanced,0.07172800103823344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,8,power_law_1.01,0.8636223793029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,8,power_law_1.01,0.04492799937725067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,8,power_law_1.01,0.04750719964504242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,8,power_law_1.01,1.0571904182434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,8,balanced,0.09731200337409973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,8,power_law_1.01,0.054028797149658206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,8,power_law_1.01,1.6937471389770509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,8,power_law_1.01,3.1646080017089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,8,power_law_1.01,0.05370240211486817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,8,balanced,0.11571199695269267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,8,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,8,power_law_1.2,0.03436799943447113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,8,power_law_1.01,0.0646016001701355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,8,power_law_1.2,0.0411327987909317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,8,balanced,0.16090666254361471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,8,power_law_1.2,0.03694719970226288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,8,power_law_1.01,0.08158079981803894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,8,power_law_1.2,0.04005120098590851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,8,power_law_1.2,0.03470720052719116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,8,power_law_1.2,0.04147840142250061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,8,power_law_1.2,0.04165120124816894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,8,balanced,0.20507733027140299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,8,power_law_1.2,0.03530240058898926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,8,power_law_1.01,0.08788480162620545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,8,power_law_1.2,0.0435263991355896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,8,power_law_1.2,0.035392001271247864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,8,power_law_1.2,0.04688639938831329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,8,power_law_1.01,0.10616320371627808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,8,power_law_1.2,0.03683840036392212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,8,balanced,0.3043946623802185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,8,power_law_1.2,0.04863359928131104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,8,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,8,power_law_1.2,0.03747200071811676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,8,power_law_1.2,0.0578495979309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,8,power_law_1.2,0.05682560205459595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,8,power_law_1.2,0.03866879940032959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,8,power_law_1.01,0.14793599843978883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,8,power_law_1.2,0.06966400146484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,8,balanced,0.3987199862798055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,8,power_law_1.2,0.04261760115623474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,8,power_law_1.2,0.0679423987865448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,8,power_law_1.2,0.05888640284538269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,8,power_law_1.2,0.04503679871559143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,8,power_law_1.2,0.06970239877700805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,8,power_law_1.2,0.04492799937725067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,8,power_law_1.01,0.17575039863586425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,8,power_law_1.2,0.07805439829826355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,8,power_law_1.2,0.052211201190948485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,8,balanced,0.500437339146932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,8,power_law_1.2,0.08993279933929443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,8,power_law_1.01,0.24746880531311036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,8,power_law_1.2,0.05397760272026062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,8,power_law_1.2,0.11473920345306396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,8,power_law_1.2,0.11991039514541627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,8,power_law_1.2,0.04737280011177063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,8,power_law_1.2,0.17320319414138793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,8,power_law_1.01,0.3669248104095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,8,power_law_1.2,0.06147199869155884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,8,power_law_1.2,0.20650238990783693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,8,power_law_1.2,0.2770303964614868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,8,power_law_1.01,0.5409855842590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,8,power_law_1.2,0.06093440055847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,8,power_law_1.2,0.3138047933578491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,8,balanced,0.7893173694610596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,8,power_law_1.2,0.06774399876594543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,8,power_law_1.01,0.6887231826782226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,8,power_law_1.2,0.4276991844177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,8,power_law_1.2,0.08386560082435608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,8,power_law_1.2,0.5489727973937988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,8,power_law_1.01,1.05163516998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,8,power_law_1.2,0.7479487895965576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,8,power_law_1.2,0.09662079811096191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,8,power_law_1.2,1.1331904411315918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,8,power_law_1.01,1.2506367683410644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,8,power_law_1.2,0.1161728024482727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,8,power_law_1.2,1.3222847938537599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,8,power_law_1.2,0.13760000467300415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,8,power_law_1.01,1.5599167823791504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,8,power_law_1.2,2.0601024627685547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,8,power_law_1.2,0.21043200492858888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,8,power_law_1.01,2.627731132507324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,8,power_law_1.2,4.197107315063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,8,power_law_1.2,0.24774401187896727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,8,power_law_1.01,4.723673629760742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,8,power_law_1.2,0.026099199056625368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,8,power_law_1.2,0.36309759616851806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,8,balanced,1.5398400624593098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,8,power_law_1.2,0.41804800033569334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,8,power_law_1.2,0.0263808012008667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,8,power_law_1.2,0.6529407978057862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,8,power_law_1.2,0.02655999958515167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,8,power_law_1.2,0.8979904174804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,8,power_law_1.2,0.028064000606536865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,8,power_law_1.2,1.1107328414916993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,8,power_law_1.2,0.028313601016998292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,8,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,8,power_law_1.2,1.714681625366211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,8,power_law_1.2,0.030681601166725157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,8,power_law_1.2,3.233990478515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,8,power_law_1.2,0.030649599432945252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,8,power_law_1.2,0.034867200255393985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,8,power_law_1.2,0.04128639996051788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,4,balanced,0.033861334125200905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,4,balanced,0.03446933378775915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,8,power_law_1.2,0.03896960020065308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,4,balanced,0.03931200007597605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,8,power_law_1.2,0.04644480049610138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,4,balanced,0.038805333276589714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,8,power_law_1.2,0.04854399859905243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,4,balanced,0.03940266619126002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,8,power_law_1.2,0.058246397972106935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,4,balanced,0.04098666707674662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,4,balanced,0.04186666508515676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,4,balanced,0.04205333193143209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,8,power_law_1.2,0.06314880251884461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,8,power_law_1.2,0.06472319960594178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,4,balanced,0.04381866753101349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,4,balanced,0.04378666480382284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,8,power_law_1.2,0.08012160062789916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,4,balanced,0.04246933261553446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,4,balanced,0.04422399898370107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,8,power_law_1.2,0.08908159732818603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,4,balanced,0.0436106671889623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,4,balanced,0.03330666571855545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,4,balanced,0.047413334250450134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,8,power_law_1.2,0.10910719633102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,4,balanced,0.033088001112143196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,4,balanced,0.05355200171470642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,4,balanced,0.03461866577466329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,4,balanced,0.054010664423306785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,4,balanced,0.03578133384386698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,8,power_law_1.2,0.14878079891204835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,4,balanced,0.03585600107908249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,4,balanced,0.05322133501370748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,4,balanced,0.03618666778008143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,4,balanced,0.06509333352247874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,4,balanced,0.036576000352700554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,8,power_law_1.2,0.18087040185928344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,4,balanced,0.06307733555634816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,4,balanced,0.03615466753641764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,8,power_law_1.2,0.280294394493103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,4,balanced,0.07898666461308797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,4,balanced,0.03730666637420654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,4,balanced,0.07971733311812083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,8,power_law_1.2,0.3640448093414307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,4,balanced,0.0372533326347669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,4,balanced,0.11335999766985576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,8,power_law_1.2,0.5069375991821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,4,balanced,0.037104000647862755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,4,balanced,0.12089600165685017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,4,balanced,0.037647999823093414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,8,power_law_1.2,0.7025856018066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,4,balanced,0.038362666964530945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,4,balanced,0.18573333819707236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,8,power_law_1.2,1.0751999855041503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,4,balanced,0.03965333352486292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,4,balanced,0.025807999074459076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,8,power_law_1.2,1.3726335525512696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,4,balanced,0.0487306664387385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,4,balanced,0.21141332387924194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,4,balanced,0.02586666742960612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,8,power_law_1.2,1.6662975311279298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,4,balanced,0.04924799998601278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,4,balanced,0.026762666801611584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,4,balanced,0.04665066798528036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,8,power_law_1.2,2.666009521484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,4,balanced,0.30164267619450885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,4,balanced,0.027834666272004444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,4,balanced,0.06112533311049143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,8,power_law_1.2,5.1298881530761715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,4,balanced,0.02908266584078471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,4,balanced,0.0613013356924057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,4,balanced,0.029215998947620392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,4,balanced,0.3906559944152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,4,balanced,0.07996800045172374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,4,balanced,0.02941333254178365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,4,balanced,0.08559999863306682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,4,balanced,0.029002666473388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,4,balanced,0.03033066789309184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,4,balanced,0.11764267086982727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,4,balanced,0.4822080135345459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,4,balanced,0.031018666923046112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,4,balanced,0.13356799880663553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,4,balanced,0.19485332568486533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,4,balanced,0.7210400104522705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,4,balanced,0.23430933554967245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,4,balanced,0.030447999636332195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,4,power_law_1.01,0.037555199861526486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,4,balanced,0.031178665657838184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,4,power_law_1.01,0.0390720009803772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,4,balanced,0.3356959819793701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,4,balanced,0.03204799940188726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,4,power_law_1.01,0.03628160059452057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,4,power_law_1.01,0.039552000164985654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,4,balanced,0.03128000100453695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,4,balanced,0.43022934595743817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,4,power_law_1.01,0.039059200882911684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,4,power_law_1.01,0.04344319999217987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,4,power_law_1.01,0.04439679980278015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,4,power_law_1.01,0.03588480055332184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,4,balanced,1.3504533767700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,4,power_law_1.01,0.04694400131702423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,4,balanced,0.528277317682902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,4,power_law_1.01,0.03451519906520843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,4,balanced,0.039621333281199135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,4,power_law_1.01,0.048563200235366824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,4,power_law_1.01,0.03293440043926239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,4,balanced,0.040720000863075256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,4,power_law_1.01,0.049420800805091855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,4,power_law_1.01,0.035097599029541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,4,power_law_1.01,0.04749439954757691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,4,balanced,0.0412266676624616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,4,power_law_1.01,0.03496319949626923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,4,power_law_1.01,0.057011198997497556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,4,balanced,0.8082559903462728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,4,power_law_1.01,0.035872000455856326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,4,power_law_1.01,0.05914239883422852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,4,power_law_1.01,0.025887998938560485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,4,power_law_1.01,0.036051198840141296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,4,balanced,0.05327466626962026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,4,power_law_1.01,0.0537280023097992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,4,power_law_1.2,0.03575679957866669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,4,power_law_1.01,0.03767040073871612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,4,balanced,0.05835733314355215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,4,power_law_1.01,0.02563839852809906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,4,power_law_1.01,0.06313599944114685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,4,power_law_1.2,0.03730559945106506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,4,power_law_1.01,0.025887998938560485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,4,power_law_1.01,0.039673599600791934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,4,power_law_1.01,0.06097919940948486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,4,power_law_1.01,0.027769601345062254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,4,power_law_1.2,0.03749119937419891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,4,power_law_1.01,0.027897599339485168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,4,power_law_1.01,0.040403199195861814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,4,power_law_1.01,0.07522559762001038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,4,power_law_1.2,0.038700801134109494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,4,power_law_1.01,0.029151999950408937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,4,power_law_1.01,0.04232319891452789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,4,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,4,power_law_1.01,0.10083199739456176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,4,power_law_1.2,0.03937279880046844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,4,balanced,1.5558560689290364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,4,power_law_1.01,0.031411200761795044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,4,power_law_1.01,0.04436480104923248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,4,power_law_1.01,0.03213439881801605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,4,power_law_1.01,0.10371840000152588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,4,power_law_1.2,0.04270080029964447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,4,power_law_1.01,0.047353601455688475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,4,balanced,0.07415999968846639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,4,power_law_1.01,0.03377279937267304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,4,power_law_1.01,0.14755840301513673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,4,power_law_1.2,0.04336000084877014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,4,power_law_1.01,0.05281919836997986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,4,power_law_1.01,0.14721920490264892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,4,power_law_1.2,0.04785920083522797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,4,power_law_1.01,0.06004480123519897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,4,power_law_1.01,0.039136001467704774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,4,power_law_1.01,0.19644800424575806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,4,power_law_1.2,0.0482367992401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,4,power_law_1.01,0.06444159746170045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,4,power_law_1.01,0.04058879911899567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,4,power_law_1.01,0.22322559356689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,4,power_law_1.2,0.049132800102233885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,4,power_law_1.01,0.045388799905776975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,4,balanced,0.08545600374539693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,4,power_law_1.01,0.06313599944114685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,4,power_law_1.01,0.04917120039463043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,4,power_law_1.2,0.04707199931144714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,4,power_law_1.01,0.33889920711517335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,4,power_law_1.01,0.08270080089569092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,4,balanced,0.11763733625411987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,4,power_law_1.2,0.05559679865837097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,4,power_law_1.01,0.38096640110015867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,4,power_law_1.01,0.09077759981155395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,4,balanced,0.14499732851982117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,4,power_law_1.01,0.06269440054893494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,4,power_law_1.2,0.06172159910202026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,4,power_law_1.01,0.7200960159301758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,4,power_law_1.01,0.12176640033721924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,4,power_law_1.01,0.060108798742294314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,4,power_law_1.2,0.05625600218772888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,4,power_law_1.01,0.9082367897033692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,4,power_law_1.01,0.11704959869384765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,4,balanced,0.21502399444580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,4,power_law_1.01,0.07508479952812194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,4,power_law_1.2,0.05988479852676391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,4,power_law_1.01,0.19259519577026368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,4,power_law_1.01,1.2203583717346191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,4,power_law_1.01,0.09139840006828308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,4,balanced,0.29082133372624713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,4,power_law_1.2,0.06627839803695679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,4,power_law_1.01,0.10202239751815796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,4,power_law_1.01,0.21476480960845948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,4,power_law_1.01,2.293471908569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,4,power_law_1.2,0.08090239763259888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,4,power_law_1.01,0.3057663917541504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,4,balanced,0.42561066150665283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,4,power_law_1.01,3.374739074707031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,4,power_law_1.2,0.09463679790496826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,4,power_law_1.01,0.13600640296936034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,4,power_law_1.01,0.3987135887145996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,4,power_law_1.2,0.11999360322952271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,4,power_law_1.01,0.16858880519866942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,4,power_law_1.01,0.5995903968811035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,4,power_law_1.2,0.1466048002243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,4,balanced,0.5456639925638834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,4,power_law_1.01,0.23469440937042235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,4,power_law_1.2,0.14799360036849976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,4,power_law_1.01,0.7803584098815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,4,power_law_1.01,0.3905344009399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,4,power_law_1.01,0.510975980758667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,4,power_law_1.2,0.19429759979248046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,4,power_law_1.01,1.019315242767334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,4,power_law_1.01,0.7967232227325439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,4,power_law_1.2,0.2442239999771118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,4,balanced,0.6830560366312662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,4,power_law_1.01,2.1004159927368162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,4,power_law_1.01,0.968716812133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,4,power_law_1.01,1.2786623954772949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,4,power_law_1.2,0.345798397064209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,4,power_law_1.01,3.1730432510375977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,4,power_law_1.01,1.5305855751037598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,4,power_law_1.2,0.5256447792053223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,4,power_law_1.01,2.729817581176758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,4,power_law_1.2,0.6177663803100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,4,power_law_1.01,5.31207046508789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,4,balanced,1.0801653067270915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,4,power_law_1.2,1.1423232078552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,4,power_law_1.2,1.2690048217773438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,4,power_law_1.2,2.434470367431641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,4,power_law_1.2,3.3287872314453124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,4,power_law_1.2,0.036652800440788266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,4,balanced,2.124821345011393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,4,power_law_1.2,0.03488639891147614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,4,power_law_1.2,0.033657601475715636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,4,power_law_1.2,0.03498240113258362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,4,power_law_1.2,0.03505919873714447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,4,power_law_1.2,0.03635840117931366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,4,power_law_1.2,0.03654400110244751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,4,power_law_1.2,0.03859840035438537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,4,power_law_1.2,0.04049279987812042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,4,power_law_1.2,0.04085760116577149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,4,power_law_1.2,0.03959679901599884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,4,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,4,power_law_1.2,0.0495743989944458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,4,power_law_1.2,0.05333120226860046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,4,power_law_1.2,0.06173440217971802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,4,power_law_1.2,0.07329279780387879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,4,power_law_1.2,0.0657151997089386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,4,power_law_1.2,0.08054400086402894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,4,power_law_1.2,0.02627840042114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,4,power_law_1.2,0.09927679896354676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,4,power_law_1.2,0.02648319900035858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,4,power_law_1.2,0.11624319553375244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,4,power_law_1.2,0.026182401180267333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,4,power_law_1.2,0.12300159931182861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,4,power_law_1.2,0.02805120050907135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,4,power_law_1.2,0.20515201091766358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,4,power_law_1.2,0.028512001037597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,4,power_law_1.2,0.2241663932800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,4,power_law_1.2,0.02932479977607727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,4,power_law_1.2,0.34476161003112793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,4,power_law_1.2,0.0297791987657547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,4,power_law_1.2,0.03152639865875244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,4,power_law_1.2,0.44133758544921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,4,power_law_1.2,0.03362559974193573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,4,power_law_1.2,0.6006656169891358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,4,power_law_1.2,0.033913600444793704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,4,power_law_1.2,0.8739968299865722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,2,balanced,0.02940800040960312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,4,power_law_1.2,1.0057920455932616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,4,power_law_1.2,0.03707520067691803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,2,balanced,0.029578665892283123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,4,power_law_1.2,1.5779647827148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,4,power_law_1.2,0.040870401263237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,2,balanced,0.03408533334732056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,4,power_law_1.2,3.3047489166259765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,4,power_law_1.2,0.04217599928379059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,2,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,2,balanced,0.039664000272750854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,4,power_law_1.2,0.05289599895477295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,2,balanced,0.03952533255020777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,2,balanced,0.04053333401679993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,4,power_law_1.2,0.055404800176620486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,2,balanced,0.04251733422279358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,4,power_law_1.2,0.06083199977874756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,2,balanced,0.04532266656557719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,4,power_law_1.2,0.07479040026664734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,2,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,2,balanced,0.04204266766707102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,4,power_law_1.2,0.08889600038528442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,2,balanced,0.03161599983771642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,2,balanced,0.04497066636880239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,4,power_law_1.2,0.10387200117111206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,2,balanced,0.03266666581233343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,2,balanced,0.04394666850566864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,2,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,2,balanced,0.04577066500981649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,2,balanced,0.03597866743803024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,2,balanced,0.05977066854635874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,4,power_law_1.2,0.1522752046585083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,2,balanced,0.03638399889071783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,2,balanced,0.06090133388837179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,4,power_law_1.2,0.1730944037437439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,2,balanced,0.03615466753641764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,2,balanced,0.05606933434804281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,2,balanced,0.036687999963760376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,4,power_law_1.2,0.2854399919509888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,2,balanced,0.06942399839560191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,2,balanced,0.03660800059636434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,4,power_law_1.2,0.3902208089828491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,2,balanced,0.06543999910354614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,2,power_law_1.01,0.029440000653266907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,2,balanced,0.03709866603215536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,4,power_law_1.2,0.6366079807281494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,2,balanced,0.0895146628220876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,2,balanced,0.03811199963092804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,2,power_law_1.01,0.03278720080852508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,4,power_law_1.2,0.7311295986175537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,2,balanced,0.08808533350626628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,2,balanced,0.03764266769091288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,2,power_law_1.01,0.031667199730873105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,4,power_law_1.2,1.2223423957824706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,2,balanced,0.0379573330283165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,2,power_law_1.01,0.04381439983844757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,2,balanced,0.12762666742006937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,4,power_law_1.2,1.5175935745239257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,2,power_law_1.01,0.037920001149177554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,2,balanced,0.03861333429813385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,2,balanced,0.15093866984049478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,4,power_law_1.2,1.6162879943847657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,2,power_law_1.01,0.046911999583244324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,2,balanced,0.03993066648642222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,2,power_law_1.01,0.049497601389884946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,2,balanced,0.025221332907676697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,2,balanced,0.050288001696268715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,4,power_law_1.2,2.7542655944824217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,2,balanced,0.21708265940348306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,2,power_law_1.01,0.03282560110092163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,2,power_law_1.01,0.04624640047550201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,2,balanced,0.02569599946339925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,2,balanced,0.050741334756215416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,4,power_law_1.2,5.635321426391601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,2,power_law_1.01,0.04527359902858734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,2,power_law_1.01,0.0323199987411499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,2,balanced,0.26492265860239667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,2,balanced,0.02640533447265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,2,balanced,0.050330668687820435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,2,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,2,power_law_1.01,0.047577598690986635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,2,power_law_1.01,0.0349375993013382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,2,balanced,0.02790933350721995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,2,balanced,0.06514666477839152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,2,power_law_1.01,0.026067200303077697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,2,power_law_1.01,0.04459519982337952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,2,power_law_1.01,0.03524479866027832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,2,balanced,0.02914133419593175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,2,power_law_1.01,0.036595198512077334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,2,balanced,0.3821920156478882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,2,power_law_1.01,0.04901120066642761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,2,balanced,0.065610667069753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,2,power_law_1.01,0.03749760091304779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,2,power_law_1.01,0.026015999913215637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,2,balanced,0.029215998947620392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,2,power_law_1.01,0.03860479891300202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,2,power_law_1.01,0.05533440113067627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,2,balanced,0.08744000395139058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,2,power_law_1.01,0.026259198784828186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,2,power_law_1.01,0.039827200770378116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,2,balanced,0.029834667841593426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,2,power_law_1.01,0.06431360244750976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,2,balanced,0.4976053237915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,2,power_law_1.01,0.040627199411392215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,2,power_law_1.01,0.028364801406860353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,2,balanced,0.09853333234786987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,2,balanced,0.029711998999118805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,2,power_law_1.01,0.038848000764846805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,2,power_law_1.01,0.06977919936180114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,2,power_law_1.01,0.04128639996051788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,2,power_law_1.01,0.028838399052619933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,2,power_law_1.01,0.0709824025630951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,2,balanced,0.13780799508094788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,2,power_law_1.01,0.04575360119342804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,2,power_law_1.01,0.030636799335479737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,2,power_law_1.01,0.07317119836807251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,2,power_law_1.01,0.05120639801025391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,2,balanced,0.030826665461063385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,2,balanced,0.6102240085601807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,2,balanced,0.1607360045115153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,2,power_law_1.01,0.055276799201965335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,2,power_law_1.01,0.03261440098285675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,2,power_law_1.01,0.0890175998210907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,2,power_law_1.01,0.06165760159492493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,2,balanced,0.03142933299144109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,2,power_law_1.01,0.03319680094718933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,2,power_law_1.01,0.06783360242843628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,2,power_law_1.01,0.08892160058021545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,2,balanced,0.229967991511027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,2,power_law_1.01,0.07715200185775757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,2,power_law_1.01,0.11755520105361938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,2,power_law_1.01,0.0896511971950531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,2,power_law_1.01,0.10820480585098266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,2,power_law_1.01,0.034297600388526917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,2,balanced,0.2924853364626567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,2,power_law_1.01,0.14508800506591796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,2,balanced,0.9111626942952474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,2,power_law_1.01,0.14156800508499146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,2,power_law_1.01,0.035283198952674864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,2,power_law_1.01,0.18411519527435302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,2,power_law_1.01,0.16546560525894166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,2,balanced,0.03257066756486893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,2,power_law_1.01,0.24137599468231202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,2,power_law_1.01,0.19668480157852172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,2,balanced,0.42204801241556805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,2,power_law_1.01,0.29900801181793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,2,balanced,0.033413333197434746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,2,power_law_1.01,0.29482240676879884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,2,power_law_1.01,0.43827199935913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,2,power_law_1.01,0.04047360122203827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,2,power_law_1.01,0.36854400634765627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,2,balanced,0.03495999922355016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,2,power_law_1.01,0.5588096141815185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,2,balanced,0.5418986479441324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,2,power_law_1.01,0.5222464084625245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,2,balanced,0.03516799956560135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,2,power_law_1.01,0.04270080029964447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,2,power_law_1.01,0.7844287872314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,2,power_law_1.01,0.8265088081359864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,2,power_law_1.01,1.0385151863098145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,2,power_law_1.01,0.04510720074176788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,2,power_law_1.01,1.333414363861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,2,power_law_1.01,0.8961919784545899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,2,power_law_1.01,0.04873600006103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,2,balanced,0.044677332043647766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,2,balanced,0.6676479975382487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,2,power_law_1.01,2.9066816329956056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,2,balanced,1.717360019683838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,2,power_law_1.01,1.7461503982543944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,2,balanced,0.045509333411852516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,2,power_law_1.01,0.05692800283432007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,2,power_law_1.01,2.321504020690918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,2,balanced,0.04930666585763296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,2,power_law_1.01,0.06122879981994629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,2,power_law_1.01,0.06808320283889771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,2,balanced,1.030741294225057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,2,balanced,0.0677706648906072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,2,power_law_1.01,0.08261119723320007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,2,balanced,0.07518399755160014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,2,power_law_1.01,0.09887359738349914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,2,balanced,0.09799999992052714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,2,power_law_1.01,0.1328703999519348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,2,balanced,2.032303969065348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,2,power_law_1.2,0.02975359857082367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,2,balanced,0.11730666955312093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,2,power_law_1.01,0.17660160064697267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,2,power_law_1.2,0.031711998581886294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,2,power_law_1.01,0.2106175899505615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,2,balanced,0.17865600188573202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,2,power_law_1.2,0.03357439935207367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,2,power_law_1.01,0.3159231901168823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,2,power_law_1.2,0.0449535995721817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,2,balanced,0.23242133855819702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,2,power_law_1.01,0.5003392219543457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,2,power_law_1.2,0.03866879940032959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,2,balanced,0.33928000926971436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,2,power_law_1.01,0.6734975814819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,2,power_law_1.2,0.04474239945411682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,2,power_law_1.01,0.8512960433959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,2,power_law_1.2,0.04967679977416992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,2,balanced,0.43938668568929035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,2,power_law_1.01,1.4623488426208495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,2,power_law_1.2,0.044172799587249754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,2,power_law_1.01,1.6274175643920898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,2,balanced,0.6473226547241211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,2,power_law_1.2,0.04746879935264588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,2,power_law_1.01,2.6287103652954102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,2,power_law_1.2,0.047891199588775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,2,power_law_1.01,4.773337554931641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,2,power_law_1.2,0.04475519955158234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,2,balanced,0.8495946725209554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,2,power_law_1.2,0.048793599009513855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,2,power_law_1.2,0.054092800617218016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,2,power_law_1.2,0.06398079991340637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,2,balanced,1.0607786973317463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,2,power_law_1.2,0.06951040029525757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,2,power_law_1.2,0.07404800057411194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,2,power_law_1.2,0.07751039862632751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,2,power_law_1.2,0.09430400133132935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,2,balanced,1.6852854092915852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,2,power_law_1.2,0.08839679956436157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,2,power_law_1.2,0.11436799764633179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,2,power_law_1.2,0.14477440118789672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,2,power_law_1.2,0.16880639791488647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,2,power_law_1.2,0.23120639324188233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,2,power_law_1.2,0.30779519081115725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,2,power_law_1.2,0.4112256050109863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,2,balanced,3.3267946243286133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,2,power_law_1.2,0.6508992195129395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,2,power_law_1.2,0.03356159925460815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,2,power_law_1.2,0.8921088218688965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,2,power_law_1.2,0.032179200649261476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,2,power_law_1.2,1.000115203857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,2,power_law_1.2,0.03223040103912354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,2,power_law_1.2,0.03505919873714447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,2,power_law_1.2,1.4277376174926757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,2,power_law_1.2,0.03489919900894165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,2,power_law_1.2,0.03648000061511993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,2,power_law_1.2,2.9309568405151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,2,power_law_1.2,0.03800959885120392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,2,power_law_1.2,0.03790079951286316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,2,power_law_1.2,0.039027199149131775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,2,power_law_1.2,0.040115201473236085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,2,power_law_1.2,0.039776000380516055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,2,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,2,power_law_1.2,0.043968001008033754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,2,power_law_1.2,0.048230400681495665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,2,power_law_1.2,0.0574720025062561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,2,power_law_1.2,0.06232960224151611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,2,power_law_1.2,0.06506239771842956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,2,power_law_1.2,0.07685120105743408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,2,power_law_1.2,0.08225280046463013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,2,power_law_1.2,0.1086016058921814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,2,power_law_1.2,0.13107839822769166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,2,power_law_1.2,0.16877440214157105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,2,power_law_1.2,0.22462079524993897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,8,balanced,0.05712000032265981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,2,power_law_1.2,0.3122688055038452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,8,balanced,0.057189335425694786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,2,power_law_1.2,0.42690558433532716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,8,balanced,0.053120002150535583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,2,power_law_1.2,0.5760960102081298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,8,balanced,0.05209066470464071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,2,power_law_1.2,0.7999296188354492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,2,power_law_1.2,0.02587519884109497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,2,power_law_1.2,0.9123135566711426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,8,balanced,0.05209066470464071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,2,power_law_1.2,1.2730815887451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,8,balanced,0.053226664662361145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,2,power_law_1.2,0.02598400115966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,8,balanced,0.038719999293486275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,2,power_law_1.2,2.877849578857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,8,balanced,0.0537066658337911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,2,power_law_1.2,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,8,balanced,0.04165866722663244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,8,balanced,0.05754666527112325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,2,power_law_1.2,0.029094401001930236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,8,balanced,0.03940266619126002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,8,balanced,0.05481599768002828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,2,power_law_1.2,0.028838399052619933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,8,balanced,0.03942933430274328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,8,balanced,0.05399466554323832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,2,power_law_1.2,0.031148800253868104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,8,balanced,0.05367999772230784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,8,balanced,0.04242666562398275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,2,power_law_1.2,0.033081600069999696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,8,balanced,0.041450666884581246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,8,balanced,0.05477866530418396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,2,power_law_1.2,0.03353599905967712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,8,balanced,0.05524266759554545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,8,balanced,0.04179200033346812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,2,power_law_1.2,0.03534719944000244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,8,balanced,0.05439466734727224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,8,balanced,0.041434665520985924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,8,balanced,0.042954668402671814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,2,power_law_1.2,0.0359360009431839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,8,balanced,0.06413866579532623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,8,balanced,0.04338666796684265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,8,balanced,0.06453866759936015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,8,balanced,0.043231998880704246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,8,balanced,0.06783466537793477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,2,power_law_1.2,0.04090240001678467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,8,balanced,0.044250667095184326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,8,balanced,0.07721066474914551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,2,power_law_1.2,0.0433023989200592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,8,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,8,balanced,0.045365333557128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,8,balanced,0.07298666735490163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,2,power_law_1.2,0.044556799530982974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,8,balanced,0.030853333572546642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,8,balanced,0.045994664231936135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,2,power_law_1.2,0.04783360064029694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,8,balanced,0.10729066530863444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,8,balanced,0.05453333258628845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,8,balanced,0.030832000076770782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,8,balanced,0.09914132952690125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,2,power_law_1.2,0.05973759889602661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,8,balanced,0.05547733108202616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,8,balanced,0.032074667513370514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,8,balanced,0.160970667997996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,2,power_law_1.2,0.06496639847755432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,8,balanced,0.060458665092786155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,8,balanced,0.033013333876927696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,2,power_law_1.2,0.0730239987373352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,8,balanced,0.033626665671666466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,8,balanced,0.06774400174617767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,8,balanced,0.15406399965286255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,8,balanced,0.033743999898433685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,8,balanced,0.07187200089295705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,2,power_law_1.2,0.08579840064048767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,8,balanced,0.22014933824539185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,8,balanced,0.03356799980004629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,8,power_law_1.01,0.060864001512527466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,8,balanced,0.09557867050170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,2,power_law_1.2,0.10390399694442749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,8,balanced,0.035743998984495796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,8,power_law_1.01,0.05597440004348755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,8,balanced,0.10528000195821126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,8,balanced,0.26574933528900146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,8,balanced,0.037765334049860634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,2,power_law_1.2,0.136735999584198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,8,power_law_1.01,0.05175039768218994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,8,balanced,0.14755200346310934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,8,power_law_1.01,0.051551997661590576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,8,balanced,0.3918293317159017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,8,balanced,0.16412267088890076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,2,power_law_1.2,0.1923200011253357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,8,power_law_1.01,0.052147197723388675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,2,power_law_1.2,0.29685120582580565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,8,balanced,0.23119467496871948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,8,power_law_1.01,0.05585920214653015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,2,power_law_1.2,0.37662079334259035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,8,balanced,0.4978080193201701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,8,balanced,0.03523733218510946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,8,power_law_1.01,0.05904639959335327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,2,power_law_1.2,0.5059711933135986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,8,balanced,0.28484266996383667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,8,balanced,0.03594133257865906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,8,power_law_1.01,0.05839999914169312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,2,power_law_1.2,0.7064511775970459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,8,balanced,0.03757333258787791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,8,power_law_1.01,0.0607807993888855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,8,balanced,0.6283573309580485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,2,power_law_1.2,1.0165184020996094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,8,balanced,0.037263999382654824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,8,balanced,0.41386667887369794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,8,power_law_1.01,0.06154239773750305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,2,power_law_1.2,1.4345343589782715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,8,power_law_1.01,0.0744383990764618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,2,power_law_1.2,1.5501503944396973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,8,balanced,0.5298080046971639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,8,power_law_1.01,0.08566399812698364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,2,power_law_1.2,2.9190528869628904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,8,power_law_1.01,0.09291520118713378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,8,balanced,0.9558719793955485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,8,balanced,0.04688533147176107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,8,power_law_1.01,0.0791167974472046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,2,power_law_1.2,5.138438415527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,8,power_law_1.01,0.03573119938373566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,8,balanced,0.04716266691684723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,8,balanced,0.6600853204727173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,8,power_law_1.01,0.09218559861183166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,8,balanced,0.0496373325586319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,8,power_law_1.01,0.03954559862613678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,8,power_law_1.01,0.1029695987701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,8,power_law_1.01,0.036108800768852235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,8,power_law_1.01,0.11991039514541627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,8,power_law_1.01,0.0377920001745224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,8,power_law_1.01,0.17031680345535277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,8,balanced,1.0313226381937664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,8,power_law_1.01,0.037785598635673524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,8,power_law_1.01,0.17002880573272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,8,power_law_1.01,0.040729600191116336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,8,balanced,1.8762292861938477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,8,power_law_1.01,0.22753279209136962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,8,balanced,0.06081599990526835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,8,power_law_1.01,0.045100799202919005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,8,power_law_1.01,0.24348158836364747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,8,power_law_1.01,0.04755200147628784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,8,balanced,0.06374933322270711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,8,power_law_1.01,0.3148288011550903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,8,power_law_1.01,0.05009920001029968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,8,power_law_1.01,0.489247989654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,8,power_law_1.01,0.030355200171470642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,8,power_law_1.01,0.05175039768218994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,8,power_law_1.01,0.7686975955963135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,8,power_law_1.01,0.05609599947929382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,8,power_law_1.01,0.030246400833129884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,8,balanced,2.005034605662028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,8,power_law_1.01,0.8297535896301269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,8,power_law_1.01,0.05878400206565857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,8,power_law_1.01,0.030399999022483824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,8,balanced,0.08040533463160197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,8,power_law_1.01,0.06820480227470398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,8,power_law_1.01,1.278054428100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,8,power_law_1.01,0.03224320113658905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,8,power_law_1.01,0.05915520191192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,8,power_law_1.01,0.032307198643684386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,8,power_law_1.01,1.7810239791870117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,8,power_law_1.01,0.07724800109863281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,8,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,8,power_law_1.01,2.1607744216918947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,8,power_law_1.01,0.08186879754066467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,8,power_law_1.01,0.04059520065784454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,8,balanced,0.09354666868845622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,8,power_law_1.01,3.351289749145508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,8,power_law_1.01,0.08628479838371277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,8,power_law_1.01,0.041228801012039185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,8,balanced,0.1290773351987203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,8,power_law_1.01,0.11200640201568604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,8,power_law_1.01,6.344601440429687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,8,power_law_1.01,0.04629760086536407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,8,power_law_1.2,0.060652798414230345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,8,balanced,0.15413866440455118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,8,power_law_1.01,0.12117760181427002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,8,power_law_1.01,0.050886398553848265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,8,power_law_1.2,0.056032001972198486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,8,power_law_1.2,0.05182719826698303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,8,power_law_1.01,0.181004798412323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,8,power_law_1.2,0.051097601652145386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,8,power_law_1.2,0.05172479748725891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,8,power_law_1.01,0.20893440246582032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,8,power_law_1.2,0.055379199981689456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,8,power_law_1.01,0.047660800814628604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,8,power_law_1.2,0.05909759998321533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,8,power_law_1.01,0.2960576057434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,8,power_law_1.01,0.056518399715423585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,8,power_law_1.2,0.057651197910308837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,8,balanced,0.2195146679878235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,8,power_law_1.01,0.3623296022415161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,8,power_law_1.2,0.05998079776763916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,8,power_law_1.01,0.05948160290718078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,8,power_law_1.2,0.05996800065040588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,8,power_law_1.01,0.512934398651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,8,power_law_1.2,0.07535359859466553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,8,power_law_1.01,0.07665280103683472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,8,balanced,0.2909333308537801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,8,power_law_1.2,0.08478720188140869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,8,power_law_1.2,0.09502720236778259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,8,power_law_1.01,0.5835648059844971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,8,power_law_1.2,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,8,balanced,0.43854931990305585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,8,power_law_1.2,0.09669119715690613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,8,power_law_1.01,0.9206080436706543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,8,power_law_1.01,0.07314559817314148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,8,power_law_1.2,0.09968000054359435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,8,power_law_1.01,1.248076820373535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,8,power_law_1.2,0.12258559465408325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,8,power_law_1.01,0.07951359748840332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,8,power_law_1.2,0.17439359426498413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,8,balanced,0.5767306486765543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,8,power_law_1.01,0.10202879905700683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,8,power_law_1.01,1.6568384170532227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,8,power_law_1.2,0.1787775993347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,8,power_law_1.2,0.25046401023864745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,8,power_law_1.01,2.458195114135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,8,power_law_1.2,0.2533056020736694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,8,power_law_1.2,0.3621567964553833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,8,power_law_1.01,0.11421439647674561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,8,power_law_1.01,4.894764709472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,8,balanced,0.7174506982167562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,8,power_law_1.2,0.5181759834289551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,8,power_law_1.01,0.13835519552230835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,8,power_law_1.2,0.7581439971923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,8,power_law_1.2,0.8748607635498047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,8,power_law_1.2,1.2913023948669433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,8,power_law_1.2,1.7873472213745116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,8,power_law_1.01,0.20931200981140136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,8,balanced,1.1365813414255779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,8,power_law_1.2,2.2904640197753907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,8,power_law_1.2,2.930438423156738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,8,power_law_1.01,0.23918719291687013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,8,power_law_1.01,0.42064638137817384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,8,power_law_1.2,6.579885101318359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,8,power_law_1.01,0.502784013748169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,8,power_law_1.01,0.7568384170532226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,8,power_law_1.01,0.9429632186889648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,8,balanced,2.2266772588094077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,8,power_law_1.01,1.3766655921936035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,8,power_law_1.01,1.8846015930175781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,8,power_law_1.01,2.206163215637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,8,power_law_1.01,3.9684864044189454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,8,power_law_1.01,7.5349372863769535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,8,power_law_1.2,0.03818880021572113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,8,power_law_1.2,0.041843199729919435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,8,power_law_1.2,0.038873600959777835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,8,power_law_1.2,0.039628800749778745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,8,power_law_1.2,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,8,power_law_1.2,0.043398401141166686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,8,power_law_1.2,0.04591360092163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,8,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,8,power_law_1.2,0.05102720260620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,8,power_law_1.2,0.052832001447677614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,8,power_law_1.2,0.03049600124359131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,8,power_law_1.2,0.05603839755058289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,8,power_law_1.2,0.03089280128479004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,8,power_law_1.2,0.0637440025806427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,8,power_law_1.2,0.03054080009460449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,8,power_law_1.2,0.06695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,8,power_law_1.2,0.03255040049552917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,4,balanced,0.04430399835109711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,8,power_law_1.2,0.061817598342895505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,8,power_law_1.2,0.03232640027999878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,4,balanced,0.04427200059096018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,8,power_law_1.2,0.07415680289268493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,8,power_law_1.2,0.035206401348114015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,4,balanced,0.0489279975493749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,8,power_law_1.2,0.08279680013656616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,4,balanced,0.05175999800364176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,8,power_law_1.2,0.040243199467658995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,8,power_law_1.2,0.08346239924430847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,4,balanced,0.052000001072883606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,8,power_law_1.2,0.04469119906425476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,8,power_law_1.2,0.11045119762420655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,4,balanced,0.05305600166320801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,8,power_law_1.2,0.04947839975357056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,4,balanced,0.05294933418432871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,8,power_law_1.2,0.12049920558929443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,4,balanced,0.03684266656637192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,8,power_law_1.2,0.05324159860610962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,4,balanced,0.0532533327738444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,8,power_law_1.2,0.15903359651565552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,4,balanced,0.03722666700681051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,4,balanced,0.053541332483291626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,8,power_law_1.2,0.21408638954162598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,4,balanced,0.0379573330283165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,8,power_law_1.2,0.04810880124568939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,4,balanced,0.053818667928377785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,8,power_law_1.2,0.30796160697937014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,4,balanced,0.038880000511805214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,4,balanced,0.053488001227378845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,8,power_law_1.2,0.06280320286750793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,8,power_law_1.2,0.37036159038543703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,4,balanced,0.04131199916203817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,4,balanced,0.05397866666316986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,8,power_law_1.2,0.06493440270423889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,8,power_law_1.2,0.5354623794555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,4,balanced,0.0407679999868075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,4,balanced,0.05397866666316986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,8,power_law_1.2,0.07524480223655701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,4,balanced,0.04074133435885111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,4,balanced,0.05762666463851929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,8,power_law_1.2,0.6454336166381835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,4,balanced,0.06446933249632518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,4,balanced,0.04031466692686081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,8,power_law_1.2,0.939686393737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,8,power_law_1.2,0.0793727993965149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,4,balanced,0.0651093324025472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,4,balanced,0.04197333256403605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,8,power_law_1.2,1.2786496162414551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,8,power_law_1.2,0.08370559811592101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,4,balanced,0.06776000062624614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,4,balanced,0.043706665436426796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,8,power_law_1.2,1.6382335662841796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,8,power_law_1.2,0.09934719800949096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,4,balanced,0.07484266658624013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,4,balanced,0.0424586683511734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,8,power_law_1.2,2.4952959060668944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,4,balanced,0.0848533312479655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,4,balanced,0.04206933577855428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,4,balanced,0.10377599795659383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,8,power_law_1.2,0.11548800468444824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,4,balanced,0.04554666578769684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,8,power_law_1.2,4.87006721496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,4,balanced,0.1341493328412374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,8,power_law_1.2,0.13923200368881225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,4,balanced,0.04692799846331278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,4,balanced,0.1548640032609304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,4,balanced,0.05600533386071523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,4,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,4,balanced,0.19814932346343994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,8,power_law_1.2,0.21468160152435303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,4,balanced,0.062080000837643944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,4,balanced,0.2717439929644267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,4,balanced,0.0722453345855077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,8,power_law_1.2,0.24325120449066162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,4,balanced,0.07487999896208446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,4,balanced,0.2991466720898946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,8,power_law_1.2,0.4181951999664307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,4,balanced,0.10283733407656352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,8,power_law_1.2,0.5094272136688233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,4,power_law_1.01,0.053964799642562865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,4,balanced,0.4352426528930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,4,balanced,0.028714666763941448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,4,balanced,0.1251520017782847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,4,power_law_1.01,0.038649600744247434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,8,power_law_1.2,0.7650623798370362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,4,power_law_1.01,0.04999040067195892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,4,balanced,0.028778667251269024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,4,power_law_1.01,0.0471807986497879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,4,balanced,0.1563146710395813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,4,power_law_1.01,0.03935360014438629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,8,power_law_1.2,1.0326272010803224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,4,balanced,0.564741333325704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,4,power_law_1.01,0.050988799333572386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,4,balanced,0.029893333713213604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,4,power_law_1.01,0.03675520122051239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,4,balanced,0.1951733430226644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,4,power_law_1.01,0.051545602083206174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,8,power_law_1.2,1.526534366607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,4,balanced,0.031210665901501972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,4,power_law_1.01,0.038796800374984744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,4,power_law_1.01,0.05578879714012146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,4,balanced,0.03259200106064478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,4,power_law_1.01,0.057011198997497556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,8,power_law_1.2,1.933305549621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,4,power_law_1.01,0.039468801021575926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,4,balanced,0.27241599559783936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,4,balanced,0.6994667053222656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,4,power_law_1.01,0.057631999254226685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,4,balanced,0.03279466678698858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,4,power_law_1.01,0.04213759899139404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,8,power_law_1.2,2.3207424163818358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,4,power_law_1.01,0.0590399980545044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,4,balanced,0.03349333256483078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,4,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,4,power_law_1.01,0.06439039707183838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,4,balanced,0.32606399059295654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,8,power_law_1.2,3.8284160614013674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,4,power_law_1.01,0.06384639739990235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,4,balanced,0.03350399931271871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,4,power_law_1.01,0.04620800018310547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,4,power_law_1.01,0.07254400253295898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,4,power_law_1.01,0.04796159863471985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,4,power_law_1.01,0.07218559980392455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,8,power_law_1.2,7.64092788696289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,4,balanced,0.4710346857706706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,4,balanced,1.1232000192006428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,4,power_law_1.01,0.06529920101165772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,4,power_law_1.01,0.04986880123615265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,4,power_law_1.01,0.08220800161361694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,4,balanced,0.03481066723664602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,4,power_law_1.01,0.05340800285339355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,4,power_law_1.01,0.08971520066261292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,4,balanced,0.03758399933576584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,4,balanced,0.6062826712926229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,4,power_law_1.01,0.09820799827575684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,4,power_law_1.01,0.055193597078323366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,4,power_law_1.01,0.13401600122451782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,4,power_law_1.01,0.11487360000610351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,4,power_law_1.01,0.05690240263938904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,4,power_law_1.01,0.17804800271987914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,4,power_law_1.01,0.062412798404693604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,4,power_law_1.01,0.22264959812164306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,4,balanced,0.7477493286132812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,4,power_law_1.01,0.06885120272636414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,4,power_law_1.01,0.2929984092712402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,4,power_law_1.01,0.030419200658798218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,4,power_law_1.01,0.4137216091156006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,4,balanced,2.1291893323262534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,4,balanced,0.03633599976698557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,4,power_law_1.01,0.07276800274848938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,4,power_law_1.01,0.5994431972503662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,4,power_law_1.01,0.02964479923248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,4,balanced,0.037258667250474296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,4,power_law_1.01,0.07832959890365601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,4,power_law_1.01,0.6486015796661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,4,power_law_1.01,0.030393600463867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,4,power_law_1.01,0.9779647827148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,4,balanced,0.03915199885765711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,4,power_law_1.01,0.0985472023487091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,4,balanced,1.1853013038635254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,4,power_law_1.01,0.0316864013671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,4,power_law_1.01,1.3526528358459473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,4,balanced,0.03972800076007843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,4,power_law_1.01,0.1149183988571167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,4,power_law_1.01,1.9271232604980468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,4,power_law_1.01,0.03240320086479187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,4,power_law_1.01,0.1441856026649475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,4,power_law_1.01,3.591455841064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,4,power_law_1.01,0.03711999952793121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,4,power_law_1.01,0.17958400249481202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,4,power_law_1.01,5.377888107299805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,4,power_law_1.01,0.24864640235900878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,4,power_law_1.01,0.03832319974899292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,4,power_law_1.01,0.040780800580978396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,4,power_law_1.01,0.31607680320739745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,4,balanced,0.05099200208981832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,4,power_law_1.01,0.39089920520782473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,4,balanced,2.282581329345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,4,power_law_1.01,0.042342400550842284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,4,balanced,0.051498666405677795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,4,power_law_1.01,0.5802752017974854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,4,power_law_1.01,0.04510720074176788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,4,balanced,0.054474666714668274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,4,power_law_1.01,0.8470144271850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,4,power_law_1.01,0.9763072013854981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,4,power_law_1.01,0.04911360144615173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,4,power_law_1.01,1.2987263679504395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,4,balanced,0.06887466708819072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,4,power_law_1.01,0.05764480233192444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,4,power_law_1.01,2.792857551574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,4,balanced,0.07573866844177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,4,power_law_1.01,0.05759360194206238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,4,power_law_1.01,4.090310287475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,4,power_law_1.01,0.06666240096092224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,4,balanced,0.09611733754475911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,4,power_law_1.01,0.07064319849014282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,4,balanced,0.1133013367652893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,4,power_law_1.01,0.0777728021144867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,4,power_law_1.01,0.09957119822502136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,4,power_law_1.01,0.09965440034866332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,4,balanced,0.16084266702334085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,4,power_law_1.01,0.11582080125808716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,4,balanced,0.20777066548665366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,4,balanced,0.3153866728146871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,4,power_law_1.01,0.1940160036087036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,4,power_law_1.01,0.25647358894348143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,4,balanced,0.40802133083343506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,4,power_law_1.01,0.433292818069458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,4,balanced,0.6040000120798746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,4,power_law_1.01,0.5483520030975342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,4,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,4,power_law_1.01,0.728985595703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,4,power_law_1.2,0.053376001119613645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,4,balanced,0.802560011545817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,4,power_law_1.01,0.937388801574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,4,power_law_1.2,0.04713599979877472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,4,power_law_1.01,1.5562623977661132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,4,power_law_1.2,0.05056639909744263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,4,power_law_1.01,1.7495807647705077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,4,balanced,0.9941759904225668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,4,power_law_1.2,0.05186560153961182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,4,power_law_1.01,2.166444778442383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,4,power_law_1.2,0.055731201171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,4,power_law_1.2,0.05735679864883423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,4,power_law_1.01,4.192230224609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,4,power_law_1.2,0.058310401439666745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,4,balanced,1.595205307006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,4,power_law_1.01,8.502566528320312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,4,power_law_1.2,0.05975040197372437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,4,power_law_1.2,0.06913920044898987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,4,power_law_1.2,0.07183359861373902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,4,power_law_1.2,0.07308800220489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,4,power_law_1.2,0.07486079931259156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,4,power_law_1.2,0.07000319957733155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,4,balanced,3.159791946411133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,4,power_law_1.2,0.09406080245971679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,4,power_law_1.2,0.10376319885253907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,4,power_law_1.2,0.1076159954071045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,4,power_law_1.2,0.1262336015701294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,4,power_law_1.2,0.1324928045272827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,4,power_law_1.2,0.18849920034408568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,4,power_law_1.2,0.03906559944152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,4,power_law_1.2,0.21858561038970947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,4,power_law_1.2,0.038950398564338684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,4,power_law_1.2,0.295961594581604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,4,power_law_1.2,0.0365119993686676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,4,power_law_1.2,0.4027008056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,4,power_law_1.2,0.03866240084171295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,4,power_law_1.2,0.03022719919681549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,4,power_law_1.2,0.5792895793914795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,4,power_law_1.2,0.03916159868240356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,4,power_law_1.2,0.04182400107383728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,4,power_law_1.2,0.7905727863311768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,4,power_law_1.2,0.030144000053405763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,2,balanced,0.03939199944337209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,4,power_law_1.2,0.04469760060310364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,4,power_law_1.2,1.2531007766723632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,4,power_law_1.2,0.030163198709487915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,2,balanced,0.041349334021409355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,4,power_law_1.2,0.0449535995721817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,4,power_law_1.2,0.03191039860248566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,4,power_law_1.2,1.2609024047851562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,2,balanced,0.050240000089009605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,4,power_law_1.2,0.047200000286102294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,4,power_law_1.2,0.032204800844192506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,4,power_law_1.2,1.9919231414794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,2,balanced,0.05115200082461039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,4,power_law_1.2,0.049030399322509764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,4,power_law_1.2,0.03731839954853058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,4,power_law_1.2,2.383251190185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,2,balanced,0.05176533261934916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,4,power_law_1.2,0.05425919890403748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,4,power_law_1.2,0.03726080060005188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,2,balanced,0.03443733354409536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,2,balanced,0.05298133194446564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,4,power_law_1.2,5.99530258178711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,4,power_law_1.2,0.05653759837150574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,2,balanced,0.05309866865475973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,4,power_law_1.2,0.04056960046291351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,2,balanced,0.03576533248027166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,4,power_law_1.2,0.05786240100860596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,2,balanced,0.05296533306439718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,2,balanced,0.03872533390919367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,4,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,4,power_law_1.2,0.04268159866333008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,2,balanced,0.05259199937184652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,2,balanced,0.03922666609287262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,4,power_law_1.2,0.07451519966125489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,4,power_law_1.2,0.046348801255226134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,2,balanced,0.053488001227378845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,2,balanced,0.04277333120505015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,4,power_law_1.2,0.08047360181808472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,2,balanced,0.05584533512592316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,2,balanced,0.042581334710121155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,4,power_law_1.2,0.08918399810791015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,2,balanced,0.0572213331858317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,4,power_law_1.2,0.05067520141601563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,2,balanced,0.042026668787002563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,4,power_law_1.2,0.09734399914741516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,2,balanced,0.05754133562246958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,4,power_law_1.2,0.11802239418029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,4,power_law_1.2,0.05754240155220032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,2,balanced,0.042362665136655174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,2,balanced,0.05852266649405161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,4,power_law_1.2,0.14595839977264405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,4,power_law_1.2,0.05464959740638733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,2,balanced,0.04390933116277059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,2,balanced,0.06474666794141133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,4,power_law_1.2,0.2119231939315796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,4,power_law_1.2,0.0655232012271881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,2,balanced,0.04513066510359446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,2,balanced,0.06613866488138835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,4,power_law_1.2,0.24318718910217285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,2,balanced,0.04417600234349569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,2,balanced,0.07085866729418437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,4,power_law_1.2,0.34849278926849364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,2,balanced,0.08454933762550354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,4,power_law_1.2,0.07388799786567687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,2,balanced,0.044624000787734985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,4,power_law_1.2,0.49006080627441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,2,balanced,0.029103999336560566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,2,balanced,0.0958666702111562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,4,power_law_1.2,0.08268799781799316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,2,balanced,0.04622933268547058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,4,power_law_1.2,0.6137728214263916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,4,power_law_1.2,0.1007040023803711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,2,balanced,0.11023466785748799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,2,balanced,0.029333333174387615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,2,balanced,0.04958933095137278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,4,power_law_1.2,0.7258111953735351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,2,balanced,0.03211733450492223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,2,balanced,0.14244799812634787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,2,balanced,0.058287998040517174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,4,power_law_1.2,1.4417216300964355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,4,power_law_1.2,0.13164160251617432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,2,balanced,0.033557333052158356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,2,balanced,0.05966933568318685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,2,balanced,0.1737013260523478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,4,power_law_1.2,1.698636817932129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,4,power_law_1.2,0.14977279901504517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,2,balanced,0.035061334570248924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,2,balanced,0.06512533128261566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,4,power_law_1.2,2.913408088684082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,2,balanced,0.23693867524464926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,2,balanced,0.03588266670703888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,4,power_law_1.2,0.18044159412384034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,2,balanced,0.07884266475836436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,4,power_law_1.2,4.483174514770508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,2,balanced,0.036848001182079315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,2,balanced,0.32571732997894287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,4,power_law_1.2,0.2342144012451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,2,balanced,0.08922132849693298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,2,balanced,0.03754133234421412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,2,balanced,0.10786133011182149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,2,balanced,0.3688746690750122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,4,power_law_1.2,0.411513614654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,2,balanced,0.1267573336760203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,4,power_law_1.2,0.5224192142486572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,2,balanced,0.03890133400758108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,2,balanced,0.18017599980036417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,2,balanced,0.5332906643549601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,4,power_law_1.2,0.7342591762542725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,2,balanced,0.04121600091457367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,4,power_law_1.2,1.0938495635986327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,2,balanced,0.2156160076459249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,2,balanced,0.7022026379903158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,4,power_law_1.2,1.7096576690673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,2,balanced,0.31015467643737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,2,power_law_1.01,0.043033599853515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,4,power_law_1.2,2.138041687011719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,2,balanced,0.3896373510360718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,2,power_law_1.01,0.042438399791717527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,2,balanced,0.04078399886687597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,4,power_law_1.2,2.4585344314575197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,2,balanced,0.8690026601155599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,2,power_law_1.01,0.04472320079803467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,2,balanced,0.04433066646258036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,2,power_law_1.01,0.050911998748779295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,4,power_law_1.2,4.383795166015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,2,balanced,0.5506720145543417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,2,balanced,0.045882667104403176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,2,power_law_1.01,0.05183359980583191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,4,power_law_1.2,7.830892944335938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,2,balanced,0.04760533571243286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,2,power_law_1.01,0.05243520140647888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,2,balanced,0.7419093449910482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,2,balanced,1.3996319770812988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,2,power_law_1.01,0.05308799743652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,2,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,2,power_law_1.01,0.035846400260925296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,2,power_law_1.01,0.059334397315979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,2,balanced,0.9168372948964437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,2,power_law_1.01,0.03608959913253784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,2,power_law_1.01,0.06001920104026794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,2,balanced,0.06028266747792562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,2,power_law_1.01,0.03551360070705414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,2,power_law_1.01,0.06004480123519897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,2,balanced,0.06234666705131531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,2,power_law_1.01,0.038841599225997926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,2,power_law_1.01,0.06255360245704651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,2,balanced,0.06611733138561249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,2,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,2,power_law_1.01,0.06436480283737182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,2,balanced,2.6626879374186196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,2,balanced,1.4573440551757812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,2,power_law_1.01,0.04226559996604919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,2,power_law_1.01,0.06526079773902893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,2,power_law_1.01,0.07416319847106934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,2,power_law_1.01,0.04257279932498932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,2,balanced,0.08793600400288899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,2,power_law_1.01,0.08689280152320862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,2,power_law_1.01,0.04339199960231781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,2,balanced,0.09687999884287517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,2,power_law_1.01,0.0865664005279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,2,power_law_1.01,0.04483200013637543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,2,power_law_1.01,0.10663039684295654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,2,power_law_1.01,0.0469760000705719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,2,power_law_1.01,0.11257599592208863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,2,power_law_1.01,0.048870399594306946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,2,power_law_1.01,0.15898879766464233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,2,balanced,2.8595199584960938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,2,power_law_1.01,0.055327999591827395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,2,power_law_1.01,0.17488640546798706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,2,balanced,0.12690132856369019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,2,power_law_1.01,0.22091519832611084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,2,power_law_1.01,0.056953597068786624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,2,balanced,0.16810667514801025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,2,power_law_1.01,0.2793792009353638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,2,power_law_1.01,0.05621119737625122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,2,balanced,0.2622879942258199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,2,power_law_1.01,0.4347968101501465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,2,power_law_1.01,0.06550400257110596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,2,power_law_1.01,0.6056704044342041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,2,balanced,0.3304426670074463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,2,power_law_1.01,0.07567999958992004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,2,power_law_1.01,0.7795072078704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,2,balanced,0.4817599852879842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,2,power_law_1.01,0.07290239930152893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,2,power_law_1.01,1.0711935997009276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,2,power_law_1.01,0.09829760193824769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,2,balanced,0.6295946836471558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,2,power_law_1.01,1.5858431816101075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,2,power_law_1.01,0.1112064003944397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,2,power_law_1.01,0.029260799288749695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,2,power_law_1.01,2.3073728561401365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,2,power_law_1.01,0.02924799919128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,2,power_law_1.01,0.13105920553207398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,2,balanced,0.9274293581644694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,2,power_law_1.01,0.030668801069259642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,2,power_law_1.01,3.683193588256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,2,power_law_1.01,0.03386240005493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,2,power_law_1.01,0.17594239711761475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,2,power_law_1.01,0.03466239869594574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,2,power_law_1.01,0.21673600673675536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,2,power_law_1.01,0.03790079951286316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,2,balanced,1.2279146512349446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,2,power_law_1.01,0.03917439877986908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,2,power_law_1.01,0.28492801189422606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,2,power_law_1.01,0.04206719994544983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,2,power_law_1.01,0.3966592073440552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,2,power_law_1.01,0.0436928004026413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,2,balanced,1.5378880500793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,2,power_law_1.01,0.5202112197875977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,2,power_law_1.01,0.043782401084899905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,2,power_law_1.01,0.7064191818237304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,2,power_law_1.01,0.05310720205307007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,2,power_law_1.01,1.0602047920227051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,2,power_law_1.01,0.05509759783744812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,2,power_law_1.01,1.4476736068725586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,2,balanced,2.4439199765523276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,2,power_law_1.01,0.057183998823165896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,2,power_law_1.01,0.062080001831054686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,2,power_law_1.01,1.9226943969726562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,2,power_law_1.01,4.227449417114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,2,power_law_1.01,0.07075200080871583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,2,power_law_1.01,0.07904000282287597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,2,power_law_1.01,0.08706560134887695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,2,power_law_1.01,0.11793919801712036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,2,power_law_1.01,0.16160639524459838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,2,balanced,4.860032081604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,2,power_law_1.2,0.04131839871406555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,2,power_law_1.01,0.22623999118804933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,2,power_law_1.01,0.24138240814208983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,2,power_law_1.2,0.041631999611854556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,2,power_law_1.01,0.3872319936752319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,2,power_law_1.2,0.043424001336097716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,2,power_law_1.01,0.4437888145446777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,2,power_law_1.01,0.7703167915344238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,2,power_law_1.2,0.050809597969055174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,2,power_law_1.01,0.857203197479248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,2,power_law_1.2,0.051846402883529666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,2,power_law_1.01,1.3019264221191407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,2,power_law_1.2,0.0529151976108551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,2,power_law_1.01,1.740185546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,2,power_law_1.01,2.0146560668945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,2,power_law_1.2,0.054662400484085084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,2,power_law_1.01,3.350387191772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,2,power_law_1.2,0.05575039982795715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,2,power_law_1.01,6.88695068359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,2,power_law_1.2,0.05854719877243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,2,power_law_1.2,0.06038399934768677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,2,power_law_1.2,0.05986559987068176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,2,power_law_1.2,0.06304640173912049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,2,power_law_1.2,0.06442239880561829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,2,power_law_1.2,0.03487359881401062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,2,power_law_1.2,0.06543999910354614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,2,power_law_1.2,0.035596799850463864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,2,power_law_1.2,0.07624959945678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,2,power_law_1.2,0.0859008014202118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,2,power_law_1.2,0.03648639917373657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,2,power_law_1.2,0.091839998960495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,2,power_law_1.2,0.03976959884166718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,2,power_law_1.2,0.11050239801406861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,2,power_law_1.2,0.04088320136070252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,2,power_law_1.2,0.12099200487136841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,2,power_law_1.2,0.04216960072517395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,2,power_law_1.2,0.15860480070114136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,2,power_law_1.2,0.04412800073623657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,2,power_law_1.2,0.1881152033805847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,2,power_law_1.2,0.04511359930038452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,2,power_law_1.2,0.23447039127349853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,2,power_law_1.2,0.04795520007610321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,2,power_law_1.2,0.3506495952606201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,2,power_law_1.2,0.047942399978637695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,2,power_law_1.2,0.4763904094696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,2,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,2,power_law_1.2,0.6395391941070556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,2,power_law_1.2,0.05236480236053467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,2,power_law_1.2,0.029145601391792297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,2,power_law_1.2,0.8970047950744628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,2,power_law_1.2,0.05454720258712768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,2,power_law_1.2,1.1088000297546388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,2,power_law_1.2,0.02951039969921112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,2,power_law_1.2,0.06104959845542908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,2,power_law_1.2,0.030022400617599487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,2,power_law_1.2,1.351046371459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,2,power_law_1.2,0.07220479846000671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,2,power_law_1.2,0.033964800834655764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,2,power_law_1.2,2.3762943267822267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,2,power_law_1.2,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,2,power_law_1.2,0.034918400645256045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,2,power_law_1.2,4.322969436645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,2,power_law_1.2,0.08026880025863647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,2,power_law_1.2,0.03734399974346161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,2,power_law_1.2,0.09850239753723145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,2,power_law_1.2,0.039743998646736146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,2,power_law_1.2,0.11780480146408082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,2,power_law_1.2,0.041388800740242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,2,power_law_1.2,0.13404799699783326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,2,power_law_1.2,0.043987199664115906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,2,power_law_1.2,0.17300479412078856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,2,power_law_1.2,0.04535680115222931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,2,power_law_1.2,0.24512639045715331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,2,power_law_1.2,0.2827199935913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,2,power_law_1.2,0.05470079779624939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,2,power_law_1.2,0.40787839889526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,2,power_law_1.2,0.05548800230026245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,2,power_law_1.2,0.5835840225219726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,2,power_law_1.2,0.061862397193908694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,2,power_law_1.2,0.8435903549194336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,2,power_law_1.2,0.0630016028881073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,2,power_law_1.2,1.1105536460876464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,64,balanced,0.1948960026105245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,2,power_law_1.2,1.4545663833618163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,2,power_law_1.2,0.07621759772300721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,2,power_law_1.2,2.1715328216552736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,64,balanced,0.18800532817840576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,64,balanced,0.1923733353614807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,2,power_law_1.2,0.08335999846458435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,2,power_law_1.2,3.9013824462890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,64,balanced,0.20042133331298828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,2,power_law_1.2,0.09447680115699768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,64,balanced,0.3485226631164551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,64,balanced,0.6583573420842489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,2,power_law_1.2,0.11683199405670167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,64,balanced,0.6876586278279623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,2,power_law_1.2,0.13360639810562133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,64,balanced,0.6823360125223795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,64,balanced,0.7502079804738363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,2,power_law_1.2,0.18913279771804808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,64,balanced,0.6479680140813192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,2,power_law_1.2,0.2810368061065674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,64,balanced,0.6976053714752197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,2,power_law_1.2,0.4603072166442871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,64,balanced,0.6327733198801676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,2,power_law_1.2,0.5239039897918701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,64,balanced,0.7555200258890787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,2,power_law_1.2,0.7019519805908203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,64,balanced,0.1176533301671346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,64,balanced,0.661850651105245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,2,power_law_1.2,1.0181376457214355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,64,balanced,0.12302399675051372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,64,balanced,0.6672106583913168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,64,balanced,0.11966933806737264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,2,power_law_1.2,1.3586432456970214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,64,balanced,0.6930773258209229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,64,balanced,0.12245866656303406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,64,balanced,0.20428266127904257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,2,power_law_1.2,1.9662208557128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,64,balanced,0.6068053245544434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,64,balanced,0.3670026858647664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,64,balanced,0.7006293137868246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,2,power_law_1.2,2.633171272277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,64,balanced,0.3708639939626058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,64,balanced,0.37795201937357586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,2,power_law_1.2,3.6424766540527345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,64,balanced,0.6355253458023071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,64,balanced,0.3736853202184041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,2,power_law_1.2,7.778463745117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,64,balanced,0.36298668384552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,64,balanced,0.6011733214060465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,64,balanced,0.37407465775807697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,64,balanced,0.5849706729253134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,64,balanced,0.3613813320795695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,64,balanced,0.37390931447347003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,64,balanced,0.36049067974090576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,64,balanced,0.506501317024231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,64,balanced,0.048570667703946434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,64,balanced,0.3819733460744222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,64,balanced,0.048197334011395775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,64,balanced,0.36416534582773846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,64,power_law_1.01,0.6583551883697509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,64,balanced,0.3645706574122111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,64,balanced,0.0489333321650823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,64,balanced,0.3599199851353963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,64,power_law_1.01,0.6604800224304199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,64,balanced,0.05421866476535797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,64,balanced,0.3799146811167399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,64,power_law_1.01,0.6133056163787842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,64,balanced,0.0658133327960968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,64,power_law_1.01,0.40033278465270994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,64,balanced,0.9209226767222086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,64,balanced,0.08930133779843648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,64,balanced,0.3772266705830892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,64,balanced,0.08558400472005208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,64,power_law_1.01,0.6236159801483154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,64,balanced,0.3582613468170166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,64,balanced,0.08654933174451192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,64,power_law_1.01,0.5829247951507568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,64,balanced,0.08673600355784099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,64,power_law_1.01,0.6324607849121093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,64,balanced,0.35951467355092365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,64,balanced,0.08703999718030293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,64,balanced,0.6686399777730306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,64,power_law_1.01,0.6574272155761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,64,power_law_1.01,0.382207989692688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,64,balanced,0.08889066179593404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,64,power_law_1.01,0.6775872230529785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,64,balanced,0.08939199646313985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,64,balanced,0.3545066515604655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,64,power_law_1.01,0.3874176025390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,64,power_law_1.01,0.6773568153381347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,64,balanced,0.09047466516494751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,64,power_law_1.01,0.24828801155090333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,64,balanced,0.09218133489290874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,64,power_law_1.01,0.5678656101226807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,64,balanced,0.32338666915893555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,64,power_law_1.01,0.22349441051483154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,64,balanced,0.09782399733861287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,64,power_law_1.01,0.6257215976715088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,64,power_law_1.01,0.28519039154052733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,64,balanced,0.9741546312967936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,64,balanced,0.0981066624323527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,64,power_law_1.01,0.6119487762451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,64,power_law_1.01,0.3395776033401489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,64,balanced,0.6366560061772665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,64,balanced,0.10055999954541524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,64,power_law_1.01,0.6082111835479737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,64,power_law_1.01,0.35514240264892577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,64,power_law_1.01,0.5976064205169678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,64,power_law_1.01,0.34641280174255373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,64,power_law_1.01,0.6157375812530518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,64,power_law_1.01,0.3513407945632935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,64,balanced,0.11174933115641277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,64,power_law_1.01,0.5455808162689209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,64,power_law_1.01,0.36017279624938964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,64,balanced,0.5803306500116984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,64,power_law_1.01,0.33350400924682616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,64,power_law_1.01,0.7374335765838623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,64,balanced,1.2781279881795247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,64,power_law_1.01,0.3634687900543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,64,power_law_1.01,0.6927807807922364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,64,power_law_1.01,0.3283967971801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,64,power_law_1.01,0.904640007019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,64,power_law_1.01,0.34350080490112306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,64,balanced,0.1209333340326945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,64,power_law_1.01,0.9152383804321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,64,balanced,0.8392000198364258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,64,power_law_1.01,0.32108159065246583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,64,power_law_1.01,1.1996095657348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,64,power_law_1.01,0.30675840377807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,64,balanced,0.13868799805641174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,64,power_law_1.01,1.4998784065246582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,64,power_law_1.01,0.3359872102737427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,64,balanced,0.1506186624368032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,64,power_law_1.01,0.40087041854858396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,64,power_law_1.01,2.134457588195801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,64,power_law_1.01,0.4302783966064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,64,power_law_1.01,2.6682048797607423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,64,balanced,1.593488057454427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,64,power_law_1.01,0.48363518714904785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,64,power_law_1.01,3.7780479431152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,64,power_law_1.01,0.5567488193511962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,64,balanced,1.098079999287923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,64,power_law_1.01,0.7295231819152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,64,power_law_1.01,5.775673675537109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,64,balanced,0.18313600619633993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,64,power_law_1.01,0.8412287712097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,64,power_law_1.01,6.611039733886718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,64,power_law_1.01,1.2612863540649415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,64,balanced,0.21039466063181558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,64,power_law_1.01,1.669856071472168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,64,power_law_1.01,12.612767791748047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,64,power_law_1.01,2.310598373413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,64,power_law_1.01,0.08536319732666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,64,balanced,0.29179733991622925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,64,power_law_1.01,3.382771301269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,64,power_law_1.01,0.07945600152015686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,64,power_law_1.01,21.92914581298828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,64,balanced,1.3485120137532551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,64,power_law_1.01,0.07344639897346497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,64,power_law_1.01,3.7634815216064452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,64,power_law_1.01,0.06873599886894226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,64,power_law_1.01,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,64,power_law_1.01,6.319827270507813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,64,power_law_1.01,0.08423680067062378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,64,balanced,0.3466506799062093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,64,power_law_1.01,0.08389760255813598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,64,balanced,2.6556426684061685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,64,power_law_1.01,0.08714240193367004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,64,power_law_1.01,12.548204803466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,64,power_law_1.01,0.08734719753265381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,64,power_law_1.01,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,64,power_law_1.01,0.09041280150413514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,64,power_law_1.01,0.10126719474792481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,64,power_law_1.2,0.6559167861938476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,64,power_law_1.01,0.10094720125198364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,64,balanced,0.4984320004781087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,64,power_law_1.01,0.11857279539108276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,64,power_law_1.2,0.6569087982177735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,64,power_law_1.01,0.12434560060501099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,64,power_law_1.2,0.36197121143341066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,64,power_law_1.01,0.12521599531173705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,64,power_law_1.2,0.42259840965270995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,64,power_law_1.2,0.4960000038146973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,64,power_law_1.01,0.14968960285186766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,64,balanced,2.1235413551330566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,64,power_law_1.2,0.5104320049285889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,64,power_law_1.2,0.5491968154907226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,64,power_law_1.2,0.5611648082733154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,64,power_law_1.01,0.16970880031585694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,64,power_law_1.2,0.6358784198760986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,64,balanced,0.6532320181528727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,64,power_law_1.2,0.5374335765838623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,64,power_law_1.2,0.6853375911712647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.01,0.16540160179138183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,64,power_law_1.2,0.6590591907501221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,64,power_law_1.01,0.20067200660705567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,64,power_law_1.2,0.6301119804382325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.01,0.2740607976913452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,64,power_law_1.2,0.5835775852203369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,64,power_law_1.2,0.5632063865661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,64,power_law_1.01,0.31198720932006835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,64,power_law_1.2,0.5953023910522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.01,0.4119423866271973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,64,power_law_1.2,0.559219217300415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,64,power_law_1.2,0.6596352100372315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,64,power_law_1.01,0.5924352169036865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,64,balanced,0.8191466331481934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,64,power_law_1.2,0.7931712150573731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.01,0.8032383918762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,64,power_law_1.2,0.9277824401855469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,64,power_law_1.01,1.1590784072875977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,64,power_law_1.2,1.1140480041503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.01,1.5838720321655273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,64,balanced,5.511903762817383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,64,power_law_1.2,1.4516351699829102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,64,power_law_1.01,1.8476800918579102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,64,power_law_1.2,1.8829568862915038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,64,power_law_1.01,3.294291305541992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,64,power_law_1.2,0.3802175998687744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,64,power_law_1.2,2.7090368270874023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,64,power_law_1.2,0.38995840549468996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,64,power_law_1.01,6.373088073730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,64,power_law_1.2,4.130265426635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,64,power_law_1.2,0.23227519989013673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,64,power_law_1.2,5.7958526611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,64,power_law_1.2,0.23527679443359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,64,power_law_1.2,0.32785921096801757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,64,power_law_1.2,8.642412567138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,64,power_law_1.2,0.252729606628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,64,balanced,4.3089599609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,64,power_law_1.2,0.3481856107711792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,64,power_law_1.2,11.254265594482423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,64,balanced,1.281557321548462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,64,power_law_1.2,0.3449280023574829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,64,power_law_1.2,0.3269439935684204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,64,power_law_1.2,19.912786865234374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,64,power_law_1.2,0.3345088005065918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,64,power_law_1.2,0.3477312088012695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,64,power_law_1.2,0.3557888031005859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,64,power_law_1.2,41.817953491210936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,64,power_law_1.2,0.3287103891372681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,64,power_law_1.2,0.3274816036224365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,64,power_law_1.2,0.33130879402160646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,64,power_law_1.2,0.32010879516601565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,64,power_law_1.2,0.2996288061141968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,64,power_law_1.2,0.3914560079574585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,64,power_law_1.2,0.46040959358215333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,64,power_law_1.2,0.5380095958709716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,64,power_law_1.2,0.7198527812957763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,64,power_law_1.2,0.8711999893188477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,64,power_law_1.2,1.1240768432617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,64,power_law_1.2,1.8247615814208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,64,power_law_1.2,2.2834239959716798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,64,power_law_1.2,3.0707136154174806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,64,power_law_1.2,4.622982406616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,64,power_law_1.2,5.428569412231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,64,balanced,2.581482728322347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,64,power_law_1.2,10.079673767089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,64,power_law_1.2,21.050630187988283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,64,power_law_1.2,0.08150399923324585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,64,power_law_1.2,0.07976319789886474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,64,power_law_1.2,0.057529598474502563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,32,balanced,0.06639466683069865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,64,power_law_1.2,0.06613759994506836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,64,power_law_1.2,0.07225599884986877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,32,balanced,0.06406933565934499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,32,balanced,0.05771199862162272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,64,power_law_1.2,0.07253119945526124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,32,balanced,0.06921599805355072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,64,power_law_1.2,0.08420479893684388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,32,balanced,0.08639466762542725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,64,power_law_1.2,0.08244479894638061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,32,balanced,0.12823466459910074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,64,power_law_1.2,0.08627200126647949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,32,balanced,0.12758400042851767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,64,power_law_1.2,0.09133440256118774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,32,balanced,0.1291039983431498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,64,power_law_1.2,0.09717760086059571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,32,balanced,0.12930132945378622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,64,power_law_1.2,0.0972927987575531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,32,balanced,0.13057600458463034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,32,balanced,0.12930132945378622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,64,power_law_1.2,0.10415359735488891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,32,balanced,0.1307253340880076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,64,power_law_1.2,0.11934080123901367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,32,balanced,0.13077333569526672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,64,power_law_1.2,0.12086399793624877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,32,balanced,0.13372266292572021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,64,power_law_1.2,0.134879994392395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,32,balanced,0.13758933544158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,64,power_law_1.2,0.16366080045700074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,32,balanced,0.1377173364162445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,32,balanced,0.14315199851989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,64,power_law_1.2,0.19532159566879273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,32,balanced,0.1499626636505127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,32,balanced,0.15957333644231161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.2,0.19690879583358764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,32,balanced,0.05640000104904175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,64,power_law_1.2,0.2380608081817627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,32,balanced,0.17109866937001547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.2,0.37431039810180666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,32,balanced,0.04994133114814758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,32,balanced,0.19271999597549438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,32,balanced,0.0484746644894282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,32,balanced,0.05658666789531708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,64,power_law_1.2,0.37043840885162355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,32,balanced,0.067930668592453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,32,balanced,0.2129439910252889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.2,0.5579135894775391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,32,balanced,0.08806399504343669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,64,power_law_1.2,0.9122176170349121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,32,balanced,0.08986133337020874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,32,balanced,0.09091732899347942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.2,1.007808017730713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,32,balanced,0.24606933196385702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,32,balanced,0.09171733260154724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,32,power_law_1.01,0.13015040159225463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,64,power_law_1.2,1.7071552276611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,32,balanced,0.09231999516487122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,32,balanced,0.04465599854787191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,32,power_law_1.01,0.12067840099334717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,32,balanced,0.09433066844940186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.2,2.689017677307129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,32,balanced,0.29999999205271405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,32,balanced,0.045423999428749084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,32,balanced,0.09496000409126282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,32,power_law_1.01,0.10063359737396241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,64,power_law_1.2,3.0880895614624024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,32,balanced,0.04541333516438802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,32,balanced,0.09684266646703084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,32,power_law_1.01,0.07962239980697632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,32,balanced,0.05442666510740916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,32,balanced,0.09893332918485005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,64,power_law_1.2,4.775238418579102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,32,power_law_1.01,0.09752320051193238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,32,power_law_1.01,0.08696960210800171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,32,balanced,0.06758399804433186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,32,balanced,0.10379733641942342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,32,power_law_1.01,0.1058303952217102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,32,balanced,0.35390400886535645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,32,power_law_1.01,0.08256000280380249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,32,balanced,0.08669333656628926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,32,balanced,0.10690666238466899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,64,power_law_1.2,9.350028991699219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,32,power_law_1.01,0.06316800117492676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,32,power_law_1.01,0.11783679723739623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,32,balanced,0.1104906698067983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,32,balanced,0.08827733000119527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,32,power_law_1.01,0.06520959734916687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,32,power_law_1.01,0.1202623963356018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,32,power_law_1.01,0.07326080203056336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,32,balanced,0.0883733332157135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,32,balanced,0.12245333194732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,32,power_law_1.01,0.07863680124282837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,32,power_law_1.01,0.12148480415344239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,32,balanced,0.08975467085838318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,32,power_law_1.01,0.0855679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,32,balanced,0.13154133160909018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,32,power_law_1.01,0.1214784026145935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,32,balanced,0.08957866827646892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,32,power_law_1.01,0.08541439771652222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,32,power_law_1.01,0.08789119720458985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,32,balanced,0.15414933363596597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,32,balanced,0.48815464973449707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,32,balanced,0.09028266867001851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,32,power_law_1.01,0.12314879894256592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,32,power_law_1.01,0.08787840008735656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,32,balanced,0.0921493371327718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,32,power_law_1.01,0.09192320108413696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,32,power_law_1.01,0.13255679607391357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,32,balanced,0.17536532878875732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,32,power_law_1.01,0.09228799939155578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,32,balanced,0.09380799531936646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,32,power_law_1.01,0.13175040483474731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,32,power_law_1.01,0.0982208013534546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,32,balanced,0.09482666850090027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,32,power_law_1.01,0.10410879850387574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,32,power_law_1.01,0.13923200368881225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,32,balanced,0.2095253268877665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,32,power_law_1.01,0.11371519565582275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,32,balanced,0.10055999954541524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,32,power_law_1.01,0.14991999864578248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,32,power_law_1.01,0.12090239524841309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,32,balanced,0.10292800267537434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,32,power_law_1.01,0.11939840316772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,32,power_law_1.01,0.8660544395446778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,32,power_law_1.01,0.14840320348739625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,32,balanced,0.10578667124112447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,32,balanced,0.2523733377456665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,32,power_law_1.01,0.16134400367736818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,32,balanced,0.5955573320388794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,32,power_law_1.01,0.15062400102615356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,32,power_law_1.01,0.1904703974723816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,32,power_law_1.01,0.1848703980445862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,32,power_law_1.01,0.2203968048095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,32,power_law_1.01,0.19145599603652955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,32,power_law_1.01,0.2742464065551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,32,power_law_1.01,0.239737606048584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,32,balanced,0.33083732922871906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,32,power_law_1.01,0.3291584014892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,32,power_law_1.01,0.2512383937835693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,32,balanced,0.11852799852689107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,32,power_law_1.01,0.4931647777557373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,32,power_law_1.01,0.30880639553070066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,32,power_law_1.01,0.601087999343872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,32,power_law_1.01,0.37845759391784667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,32,power_law_1.01,0.8085311889648438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,32,power_law_1.01,0.516755199432373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,32,power_law_1.01,1.1004799842834472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,32,balanced,0.40693867206573486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,32,power_law_1.01,0.6016575813293457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,32,power_law_1.01,1.3324864387512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,32,balanced,0.7663146654764811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,32,power_law_1.01,0.8430272102355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,32,power_law_1.01,1.9435840606689454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,32,power_law_1.01,1.140998363494873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,32,balanced,0.12963733077049255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,32,power_law_1.01,4.244953536987305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,32,power_law_1.01,1.3986047744750976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,32,power_law_1.01,0.08795520067214965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,32,balanced,0.1492639978726705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,32,power_law_1.01,2.1714431762695314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,32,balanced,0.5753920078277588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,32,power_law_1.01,0.0846015989780426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,32,balanced,0.163290669520696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,32,power_law_1.01,0.06555520296096802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,32,power_law_1.01,4.723027038574219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,32,power_law_1.01,0.06220800280570984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,32,power_law_1.2,0.13006080389022828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,32,power_law_1.01,0.06974080204963684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,32,power_law_1.2,0.12003840208053589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,32,power_law_1.01,0.07563520073890687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,32,balanced,0.204202671845754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,32,power_law_1.2,0.06984320282936096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,32,power_law_1.01,0.08149120211601257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,32,power_law_1.2,0.08032000064849854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,32,balanced,0.7354293664296468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,32,power_law_1.01,0.0892416000366211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,32,power_law_1.2,0.08071680068969726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,32,balanced,1.1249706745147705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,32,balanced,0.23564799626668295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,32,power_law_1.01,0.08596479892730713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,32,power_law_1.2,0.09909120202064514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,32,power_law_1.01,0.08609920144081115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,32,power_law_1.2,0.11869440078735352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,32,power_law_1.01,0.09131519794464112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,32,balanced,0.33563733100891113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,32,power_law_1.2,0.10607999563217163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,32,power_law_1.2,0.1071552038192749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,32,power_law_1.01,0.09970560073852539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,32,power_law_1.2,0.1177024006843567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,32,power_law_1.01,0.10607359409332276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,32,power_law_1.2,0.12511359453201293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,32,power_law_1.01,0.10800000429153442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,32,balanced,0.4121439854303996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,32,power_law_1.2,0.13904639482498168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,32,power_law_1.01,0.11294080018997192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,32,balanced,0.9145706494649252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,32,power_law_1.2,0.1400063991546631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,32,power_law_1.01,0.11963520050048829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,32,power_law_1.2,0.3842175960540771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,32,power_law_1.01,0.14440319538116456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,32,power_law_1.2,1.1028736114501954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,32,power_law_1.2,1.3600128173828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,32,power_law_1.01,0.15843839645385743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,32,power_law_1.2,0.17167999744415283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,32,power_law_1.2,0.20663039684295653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,32,power_law_1.2,0.2119296073913574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,32,balanced,0.6016639868418375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,32,power_law_1.01,0.16344959735870362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,32,power_law_1.2,0.2608576059341431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,32,power_law_1.01,0.2116544008255005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,32,power_law_1.2,0.2772608041763306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,32,power_law_1.01,0.2740607976913452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,32,power_law_1.2,0.37624320983886717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,32,power_law_1.2,0.4580543994903564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,32,power_law_1.01,0.3600127935409546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,32,power_law_1.2,0.6177855968475342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,32,balanced,1.3930400212605794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,32,power_law_1.01,0.4178880214691162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,32,power_law_1.2,0.800607967376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,32,balanced,0.7889653046925863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,32,power_law_1.01,0.5451903820037842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,32,power_law_1.2,1.2496895790100098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,32,power_law_1.01,0.7711616039276123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,32,power_law_1.2,1.4745087623596191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,32,balanced,2.2414719263712564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,32,power_law_1.2,2.0032255172729494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,32,power_law_1.01,1.0710207939147949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,32,power_law_1.2,3.0016319274902346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,32,power_law_1.01,1.3635199546813965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,32,power_law_1.01,1.8681407928466798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,32,power_law_1.2,7.27852783203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,32,power_law_1.01,3.5058048248291014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,32,balanced,0.9714132944742838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,32,power_law_1.01,6.611698913574219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,32,power_law_1.2,0.08201599717140198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,32,power_law_1.2,0.08272640109062195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,32,power_law_1.2,0.05358080267906189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,32,power_law_1.2,0.06303359866142273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,32,balanced,1.5275626182556152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,32,power_law_1.2,0.07138559818267823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,32,power_law_1.2,0.07773439884185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,32,balanced,2.7699947357177734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,32,power_law_1.2,0.0831167995929718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,32,power_law_1.2,0.08520960211753845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,32,power_law_1.2,0.08698880076408386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,32,power_law_1.2,0.0837119996547699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,32,power_law_1.2,0.0926144003868103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,32,power_law_1.2,0.09664000272750854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,32,power_law_1.2,0.10071040391921997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,32,power_law_1.2,0.10266879796981812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,32,power_law_1.2,0.1164736032485962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,32,power_law_1.2,0.12624000310897826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,32,power_law_1.2,0.1295359969139099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,32,power_law_1.2,0.15306240320205688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,32,power_law_1.2,0.1536128044128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,32,power_law_1.2,0.21431679725646974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,32,power_law_1.2,0.23388159275054932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,32,power_law_1.2,0.3010240077972412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,32,power_law_1.2,0.3596544027328491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,32,power_law_1.2,0.5102272033691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,16,balanced,0.05588266750176748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,32,power_law_1.2,0.6910719871520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,16,balanced,0.05690133571624756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,32,balanced,3.06606388092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,32,power_law_1.2,0.09194239974021912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,32,power_law_1.2,0.9717056274414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,16,balanced,0.05859733124574026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,32,power_law_1.2,0.0840511977672577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,32,power_law_1.2,1.3715519905090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,16,balanced,0.07008533179759979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,32,power_law_1.2,0.05397760272026062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,32,power_law_1.2,0.06287999749183655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,16,balanced,0.08683733145395915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,32,power_law_1.2,1.6136768341064454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,32,power_law_1.2,0.06788480281829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,16,balanced,0.1270240048567454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,32,power_law_1.2,0.07928959727287292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,32,power_law_1.2,2.694508743286133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,16,balanced,0.12846933801968893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,32,power_law_1.2,0.07994239926338195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,32,power_law_1.2,0.08472319841384887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,16,balanced,0.12849066654841104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,32,power_law_1.2,5.57696647644043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,32,power_law_1.2,0.08542079925537109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,16,balanced,0.12793599565823874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,32,power_law_1.2,0.08687999844551086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,32,power_law_1.2,0.09451519846916198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,16,balanced,0.12868266304334006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,32,power_law_1.2,0.09790080189704894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,16,balanced,0.12994666894276938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,32,power_law_1.2,0.10145920515060425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,16,balanced,0.13134400049845377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,32,power_law_1.2,0.10618239641189575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,32,power_law_1.2,0.12251520156860352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,16,balanced,0.1318773329257965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,32,power_law_1.2,0.13339519500732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,32,power_law_1.2,0.1442304015159607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,16,balanced,0.13403733571370444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,16,balanced,0.13924800356229147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,32,power_law_1.2,0.17961599826812744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,16,balanced,0.13970667123794556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,16,balanced,0.1458186705907186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,32,power_law_1.2,0.18867199420928954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,16,balanced,0.1541973352432251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,32,power_law_1.2,0.2601344108581543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,32,power_law_1.2,0.3087680101394653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,16,balanced,0.16409066319465637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,32,power_law_1.2,0.3807615995407104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,16,balanced,0.1882879932721456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,32,power_law_1.2,0.5663296222686768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,32,power_law_1.2,0.7045440196990966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,16,balanced,0.20115200678507486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,32,power_law_1.2,1.1107839584350585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,16,balanced,0.2294399936993917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,32,power_law_1.2,1.5065279960632325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,32,power_law_1.2,2.12476806640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,32,power_law_1.2,2.793132781982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,16,balanced,0.2749333381652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,32,power_law_1.2,4.37468147277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,32,power_law_1.2,10.078067016601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,16,balanced,0.326474666595459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,16,balanced,0.047450666626294456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,16,balanced,0.04863466819127401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,16,balanced,0.04889066517353058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,16,balanced,0.40848533312479657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,16,balanced,0.05611200133959452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,16,balanced,0.06930666665236156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,16,balanced,0.09025067090988159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,16,balanced,0.09168533484141032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,16,balanced,0.04529599845409393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,16,power_law_1.01,0.09434239864349366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,16,balanced,0.09322667121887207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,16,balanced,0.0938933293024699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,16,balanced,0.04590400060017904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,16,power_law_1.01,0.12958719730377197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,16,balanced,0.5594346523284912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,16,balanced,0.09403199950853984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,16,balanced,0.04688533147176107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,16,power_law_1.01,0.07830399870872498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,16,balanced,0.0582826683918635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,16,balanced,0.09629866480827332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,16,power_law_1.01,0.07459200024604798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,16,balanced,0.06983999907970428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,16,balanced,0.09702933828035991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,16,power_law_1.01,0.08459519743919372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,16,balanced,0.09026666482289632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,16,balanced,0.09918399651845296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,16,power_law_1.01,0.09773439764976502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,16,balanced,0.09153599540392558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,16,balanced,0.10006933410962422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,16,power_law_1.01,0.1139456033706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,16,balanced,0.09250133236249287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,16,balanced,0.10603200395901997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,16,balanced,0.09324799974759419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,16,power_law_1.01,0.1161471962928772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,16,balanced,0.7444586753845215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,16,balanced,0.10832533240318298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,16,balanced,0.09378133217493693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,16,power_law_1.01,0.1191167950630188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,16,balanced,0.11319466431935628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,16,balanced,0.09474666913350423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,16,power_law_1.01,0.1135103940963745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,16,balanced,0.12731200456619263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,16,balanced,0.09566932916641235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,16,power_law_1.01,0.12743040323257446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,16,balanced,0.09809600313504536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,16,balanced,0.14073066910107931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,16,power_law_1.01,0.12460800409317016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,16,power_law_1.01,0.06954879760742187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,16,balanced,0.10050132870674133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,16,power_law_1.01,0.12899839878082275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,16,balanced,0.16355199615160623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,16,balanced,0.10604799787203471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,16,power_law_1.01,0.08844799995422363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,16,power_law_1.01,0.13872640132904052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,16,balanced,0.10853333274523418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,16,power_law_1.01,0.054739201068878175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,16,balanced,0.18547733624776205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,16,power_law_1.01,0.3896512031555176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,16,balanced,0.11473066608111064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,16,power_law_1.01,0.06135680079460144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,16,balanced,0.9480053583780924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,16,power_law_1.01,0.39375360012054444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,16,power_law_1.01,0.06677759885787964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,16,balanced,0.2270560065905253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,16,power_law_1.01,0.15928959846496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,16,power_law_1.01,0.077183997631073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,16,power_law_1.01,0.17821439504623413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,16,power_law_1.01,0.08351359963417053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,16,balanced,0.2744586666425069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,16,balanced,0.12919466694196066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,16,power_law_1.01,0.19764480590820313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,16,power_law_1.01,0.08497920036315917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,16,power_law_1.01,0.22856318950653076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,16,power_law_1.01,0.08709120154380798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,16,power_law_1.01,0.08895360231399536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,16,power_law_1.01,0.2574912071228027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,16,balanced,0.35715198516845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,16,power_law_1.01,0.08959360122680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,16,power_law_1.01,0.3143104076385498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,16,power_law_1.01,0.09214720129966736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,16,power_law_1.01,0.39743359088897706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,16,power_law_1.01,0.09946240186691284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,16,balanced,0.1493066648642222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,16,power_law_1.01,0.49903359413146975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,16,power_law_1.01,0.1063423991203308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,16,balanced,0.4533066749572754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,16,power_law_1.01,0.6243264198303222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,16,power_law_1.01,0.11359360218048095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,16,balanced,0.17410133282343546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,16,power_law_1.01,0.11723519563674926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,16,power_law_1.01,0.8941439628601074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,16,balanced,1.2961333592732747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,16,balanced,0.1902666687965393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,16,power_law_1.01,0.12432639598846436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,16,power_law_1.01,1.104576015472412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,16,power_law_1.01,0.14551680088043212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,16,power_law_1.01,1.4696063995361328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,16,power_law_1.01,0.16117759943008422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,16,balanced,0.24913066625595093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,16,power_law_1.01,0.1876736044883728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,16,balanced,0.6413173278172811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,16,power_law_1.01,2.143987274169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,16,power_law_1.01,0.241811203956604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,16,balanced,0.30180267492930096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,16,power_law_1.01,0.2917056083679199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,16,power_law_1.01,4.113951873779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,16,power_law_1.01,0.35564160346984863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,16,power_law_1.01,0.072326397895813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,16,power_law_1.01,0.44774398803710935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,16,balanced,0.4492479960123698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,16,power_law_1.01,0.09216639995574952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,16,power_law_1.01,0.5768127918243409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,16,power_law_1.01,0.05797119736671448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,16,power_law_1.01,0.8286335945129395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,16,balanced,0.8011199633280436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,16,power_law_1.01,0.06213120222091675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,16,power_law_1.2,0.0948095977306366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,16,power_law_1.01,1.0912768363952636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,16,power_law_1.01,0.06575999855995178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,16,balanced,0.5479520161946615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,16,power_law_1.2,0.11560319662094116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,16,power_law_1.01,1.3741184234619142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,16,power_law_1.01,0.0770687997341156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,16,power_law_1.2,0.06348159909248352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,16,power_law_1.01,0.0840511977672577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,16,power_law_1.01,2.0743104934692385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,16,power_law_1.2,0.07269759774208069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,16,power_law_1.01,0.08734719753265381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,16,power_law_1.2,0.07868160009384155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,16,power_law_1.01,4.4990081787109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,16,power_law_1.01,0.08828160166740417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,16,power_law_1.2,0.08537600040435792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,16,power_law_1.01,0.09095039963722229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,16,balanced,0.7948799928029379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,16,power_law_1.2,0.11205120086669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,16,power_law_1.01,0.09896320104598999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,16,balanced,1.0314079920450847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,16,power_law_1.2,0.11352959871292115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,16,power_law_1.01,0.09970560073852539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,16,power_law_1.2,0.11632000207901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,16,power_law_1.01,0.10428800582885742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,16,power_law_1.2,0.11887359619140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,16,power_law_1.01,0.11128959655761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,16,power_law_1.2,0.12650879621505737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,16,power_law_1.01,0.12284159660339355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,16,balanced,2.5537333488464355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,16,power_law_1.01,0.12572159767150878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,16,power_law_1.2,0.12658560276031494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,16,balanced,1.0387519995371501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,16,power_law_1.2,0.13304320573806763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,16,power_law_1.01,0.1472000002861023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,16,power_law_1.2,0.14205440282821655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,16,power_law_1.2,1.0986623764038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,16,power_law_1.01,0.17345919609069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,16,power_law_1.2,1.3415807723999023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,16,power_law_1.2,0.16672639846801757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,16,balanced,1.5479200681050618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,16,power_law_1.01,0.18019839525222778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,16,power_law_1.2,0.19930880069732665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,16,power_law_1.01,0.2274240016937256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,16,power_law_1.2,0.06996480226516724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,16,power_law_1.2,0.20655360221862792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,16,balanced,1.2866506576538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,16,power_law_1.01,0.2858880043029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,16,power_law_1.2,0.08697599768638611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,16,power_law_1.2,0.26177918910980225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,16,power_law_1.2,0.05082880258560181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,16,power_law_1.01,0.3740992069244385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,16,power_law_1.2,0.05920640230178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,16,power_law_1.2,0.26440958976745604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,16,power_law_1.2,0.06725760102272034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,16,power_law_1.01,0.4838079929351807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,16,power_law_1.2,0.3524159908294678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,16,power_law_1.2,0.07120640277862549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,16,power_law_1.2,0.08284159898757934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,16,power_law_1.01,0.7068287849426269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,16,power_law_1.2,0.4146304130554199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,16,power_law_1.2,0.08402559757232667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,16,power_law_1.2,0.5887296199798584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,16,power_law_1.01,0.899788761138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,16,power_law_1.2,0.08755199909210205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,16,power_law_1.2,0.08983039855957031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,16,power_law_1.2,0.7414144039154053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,16,power_law_1.01,1.2166848182678223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,16,power_law_1.2,0.09151359796524047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,16,power_law_1.2,1.0605952262878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,16,power_law_1.2,0.09449599981307984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,16,power_law_1.01,1.701696014404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,16,power_law_1.2,0.10314240455627441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,16,power_law_1.2,1.4190719604492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,16,power_law_1.2,0.10891519784927368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,16,power_law_1.01,2.152288055419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,16,power_law_1.2,0.11729919910430908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,16,power_law_1.2,1.888172721862793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,16,power_law_1.2,0.13021440505981446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,16,power_law_1.01,3.6179519653320313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,16,power_law_1.2,0.12453759908676147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,16,power_law_1.2,2.788467216491699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,16,balanced,2.03330659866333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,16,power_law_1.2,0.1471743941307068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,16,power_law_1.01,6.6591743469238285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,16,power_law_1.2,0.16550400257110595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,16,power_law_1.2,0.20976641178131103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,16,power_law_1.2,6.203417587280273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,16,power_law_1.2,0.24681599140167237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,16,power_law_1.2,0.33895680904388426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,16,power_law_1.2,0.37317121028900146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,16,power_law_1.2,0.4913856029510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,16,power_law_1.2,0.6664447784423828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,16,power_law_1.2,0.9142208099365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,16,power_law_1.2,1.2821824073791503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,16,power_law_1.2,1.5847104072570801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,16,balanced,3.0755786895751953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,16,power_law_1.2,2.5345600128173826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,16,power_law_1.2,5.392620849609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,16,balanced,4.059333483378093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,16,power_law_1.2,0.07166079878807068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,16,power_law_1.2,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,8,balanced,0.05628266433874766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,16,power_law_1.2,0.052025598287582395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,8,balanced,0.05552533268928528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,16,power_law_1.2,0.061740797758102414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,8,balanced,0.05844266712665558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,16,power_law_1.2,0.06859520077705383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,8,balanced,0.07092800239721934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,16,power_law_1.2,0.07027199864387512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,8,balanced,0.08959999680519104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,16,power_law_1.2,0.08207359910011292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,8,balanced,0.13091199596722922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,8,balanced,0.13195733229319254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,16,power_law_1.2,0.0824895977973938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,8,balanced,0.13179199894269308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,16,power_law_1.2,0.08796160221099854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,8,balanced,0.1330453356107076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,16,power_law_1.2,0.09211519956588746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,8,balanced,0.13378133376439413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,16,power_law_1.2,0.09036800265312195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,8,balanced,0.1346879998842875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,16,power_law_1.2,0.10333440303802491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,8,balanced,0.1365493337313334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,16,power_law_1.2,0.10888320207595825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,8,balanced,0.13854400316874185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,16,power_law_1.2,0.11348479986190796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,8,balanced,0.1393119990825653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,16,power_law_1.2,0.12277760505676269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,8,balanced,0.0476800004641215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,8,balanced,0.14451199769973755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,16,power_law_1.2,0.13009920120239257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,8,balanced,0.04846400022506714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,8,balanced,0.14622933665911356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,16,power_law_1.2,0.1602687954902649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,8,balanced,0.049839998284975685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,8,balanced,0.15126400192578635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,8,balanced,0.06009600063165029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,8,balanced,0.166101336479187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,8,balanced,0.07237333556016286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,16,power_law_1.2,0.17967360019683837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,8,balanced,0.09762666622797649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,8,balanced,0.1832853356997172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,8,balanced,0.09889066219329834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,8,balanced,0.09929066896438599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,8,balanced,0.20517865816752115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,8,balanced,0.10100266337394714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,16,power_law_1.2,0.18617600202560425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,8,balanced,0.10028800368309021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,16,power_law_1.2,0.25557119846343995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,8,balanced,0.22790932655334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,8,balanced,0.10321600238482158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,16,power_law_1.2,0.3491904020309448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,8,balanced,0.10448533296585083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,16,power_law_1.2,0.45420160293579104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,8,balanced,0.10642133156458537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,8,balanced,0.2619306643803914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,8,balanced,0.10833066701889038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,16,power_law_1.2,0.5528063774108887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,8,balanced,0.11601066589355469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,16,power_law_1.2,0.8609472274780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,8,balanced,0.304970661799113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,8,balanced,0.1185706655184428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,16,power_law_1.2,1.118943977355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,8,balanced,0.12475732962290446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,16,power_law_1.2,1.4238528251647948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,8,balanced,0.13938132921854654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,16,power_law_1.2,2.2209856033325197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,8,balanced,0.39607465267181396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,8,balanced,0.1583466629187266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,16,power_law_1.2,2.399372863769531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,8,balanced,0.18534932533899942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,16,power_law_1.2,4.975635147094726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,8,balanced,0.5363893508911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,8,balanced,0.2097439964612325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,16,power_law_1.2,9.44417953491211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,8,power_law_1.01,0.07025279998779296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,8,balanced,0.26124799251556396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,8,power_law_1.01,0.09367679953575134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,8,balanced,0.31364800532658893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,8,power_law_1.01,0.06495360136032105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,8,balanced,0.7637226581573486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,8,power_law_1.01,0.06995199918746949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,8,power_law_1.01,0.08401920199394226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,8,balanced,0.42714134852091473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,8,power_law_1.01,0.08753920197486878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,8,power_law_1.01,0.05658239722251892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,8,balanced,0.047637333472569786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,8,power_law_1.01,0.1133504033088684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,8,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,8,power_law_1.01,0.07109119892120361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,8,power_law_1.01,0.11171200275421142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,8,balanced,0.05273599922657013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,8,power_law_1.01,0.06462079882621766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,8,power_law_1.01,0.05613440275192261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,8,power_law_1.01,0.11851520538330078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,8,balanced,0.9054826895395914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,8,balanced,0.5656960010528564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,8,balanced,0.0650186687707901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,8,power_law_1.01,0.060096001625061034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,8,power_law_1.01,0.07712000012397766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,8,power_law_1.01,0.12314239740371705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,8,balanced,0.07641066610813141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,8,power_law_1.01,0.06887680292129517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,8,power_law_1.01,0.06030719876289368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,8,power_law_1.01,0.12896640300750734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,8,balanced,0.10108799735705058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,8,power_law_1.01,0.07365120053291321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,8,power_law_1.01,0.06775040030479432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,8,power_law_1.01,0.12832640409469603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,8,balanced,0.103493332862854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,8,power_law_1.01,0.07308800220489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,8,power_law_1.01,0.08427519798278808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,8,balanced,0.10502933462460835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,8,power_law_1.01,0.1369472026824951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,8,power_law_1.01,0.08105599880218506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,8,power_law_1.01,0.09007359743118286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,8,balanced,0.10582933823267619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,8,power_law_1.01,0.14621440172195435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,8,balanced,0.8206666310628256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,8,power_law_1.01,0.09316480159759521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,8,balanced,0.1072213351726532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,8,power_law_1.01,0.09037439823150635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,8,power_law_1.01,0.15791360139846802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,8,power_law_1.01,0.09457280039787293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,8,balanced,0.10899200042088826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,8,power_law_1.01,0.0917952001094818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,8,balanced,1.1698559919993083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,8,power_law_1.01,1.1064831733703613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,8,power_law_1.01,0.09893760085105896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,8,balanced,0.1109920044740041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,8,power_law_1.2,0.07004799842834472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,8,power_law_1.01,0.09523839950561523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,8,power_law_1.01,1.3534784317016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,8,power_law_1.01,0.10060160160064698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,8,balanced,0.1144426663716634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,8,power_law_1.2,0.09059839844703674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,8,power_law_1.01,0.09742079973220825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,8,power_law_1.01,1.390329647064209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,8,power_law_1.2,0.06495360136032105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,8,power_law_1.01,0.10392320156097412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,8,balanced,0.11674666404724121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,8,power_law_1.01,0.10528639554977418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,8,power_law_1.2,0.06944640278816223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,8,power_law_1.01,0.11787519454956055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,8,power_law_1.01,0.2029439926147461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,8,balanced,0.12451199690500896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,8,power_law_1.2,0.07660160064697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,8,power_law_1.01,0.1126207947731018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,8,power_law_1.01,0.12035200595855713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,8,balanced,1.007263978322347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,8,power_law_1.2,0.08718079924583436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,8,power_law_1.01,0.2381119966506958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,8,balanced,0.12895466883977255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,8,power_law_1.2,0.1102720022201538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,8,power_law_1.01,0.13071999549865723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,8,power_law_1.01,0.12439039945602418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,8,power_law_1.01,0.2886143922805786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,8,power_law_1.2,0.11345280408859253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,8,balanced,0.135535995165507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,8,power_law_1.01,0.14263039827346802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,8,power_law_1.2,0.11534719467163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,8,power_law_1.01,0.13160959482192994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,8,power_law_1.01,0.3244287967681885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,8,power_law_1.2,0.11447679996490479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,8,power_law_1.01,0.1513152003288269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,8,power_law_1.01,0.13381760120391845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,8,power_law_1.01,0.41515522003173827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,8,power_law_1.2,0.13041919469833374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,8,power_law_1.01,0.16911360025405883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,8,power_law_1.2,0.1314560055732727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,8,power_law_1.01,0.15363839864730836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,8,power_law_1.01,0.5210303783416748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,8,power_law_1.2,0.13492480516433716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,8,balanced,0.158869336048762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,8,power_law_1.01,0.1744320034980774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,8,power_law_1.01,0.6709184169769287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,8,power_law_1.2,0.1484544038772583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,8,power_law_1.2,1.1015104293823241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,8,power_law_1.01,0.2121920108795166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,8,power_law_1.01,0.21184000968933106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,8,power_law_1.01,0.9747008323669434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,8,balanced,1.6191253662109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,8,power_law_1.2,1.3502911567687987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,8,power_law_1.01,0.2556096076965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,8,power_law_1.01,1.1625791549682618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,8,power_law_1.2,1.354751968383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,8,balanced,1.2940586407979329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,8,power_law_1.2,1.3901375770568847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,8,power_law_1.01,0.3097343921661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,8,power_law_1.01,1.4684351921081542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,8,power_law_1.2,0.21303679943084716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,8,power_law_1.01,0.3736704111099243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,8,power_law_1.2,0.2452415943145752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,8,power_law_1.01,2.2133312225341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,8,power_law_1.01,0.22200319766998292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,8,balanced,0.18781866629918417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,8,power_law_1.2,0.2803328037261963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,8,power_law_1.01,0.532096004486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,8,power_law_1.01,0.28323841094970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,8,power_law_1.2,0.3913664102554321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,8,power_law_1.01,0.6841407775878906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,8,balanced,0.22883733113606772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,8,power_law_1.01,4.623980712890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,8,power_law_1.2,0.4332479953765869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,8,power_law_1.01,0.3649215936660767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,8,power_law_1.01,0.9917632102966308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,8,power_law_1.2,0.6338367938995362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,8,power_law_1.01,0.49045758247375487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,8,balanced,0.2632373372713725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,8,power_law_1.2,0.6905792236328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,8,power_law_1.01,1.243558406829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,8,power_law_1.01,0.5816512107849121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,8,power_law_1.2,1.0895423889160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,8,power_law_1.2,1.2973695755004884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,8,power_law_1.01,1.5208767890930175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,8,power_law_1.01,0.9056192398071289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,8,balanced,0.3723893165588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,8,power_law_1.2,1.6026687622070312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,8,power_law_1.01,1.1985983848571777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,8,power_law_1.01,2.509619140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,8,power_law_1.2,2.527507209777832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,8,power_law_1.01,1.6756351470947266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,8,balanced,0.4447893301645915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,8,power_law_1.01,4.762124633789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,8,power_law_1.2,6.101766586303711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,8,power_law_1.01,2.1639936447143553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,8,balanced,1.9192372957865398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,8,power_law_1.01,2.7026880264282225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,8,balanced,0.6685813268025717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,8,power_law_1.01,4.213996887207031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,8,power_law_1.01,8.38529281616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,8,balanced,0.82424529393514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,8,balanced,3.2029546101888022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,8,balanced,1.1933706601460774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,8,balanced,1.5565759340922039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,8,balanced,3.739018758138021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,8,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,8,power_law_1.2,0.06442880034446716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,8,power_law_1.2,0.050246399641036985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,8,balanced,1.9335360527038574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,8,power_law_1.2,0.057708799839019775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,8,power_law_1.2,0.06565759778022766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,8,power_law_1.2,0.075135999917984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,8,power_law_1.2,0.08725759983062745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,8,power_law_1.2,0.08985599875450134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,8,power_law_1.2,0.0876416027545929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,8,power_law_1.2,0.08936960101127625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,8,power_law_1.2,0.09534080028533935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,8,power_law_1.2,0.09964799880981445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,8,power_law_1.2,0.10126719474792481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,8,power_law_1.2,0.11416319608688355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,8,balanced,3.0555413564046225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,8,power_law_1.2,0.12728960514068605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,8,power_law_1.2,0.1335360050201416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,8,power_law_1.2,0.13662079572677613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,8,power_law_1.2,0.15829119682312012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,8,power_law_1.2,0.1815551996231079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,8,power_law_1.2,0.21910400390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,8,power_law_1.2,0.272761607170105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,8,power_law_1.2,0.3241919994354248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,8,power_law_1.2,0.3801984071731567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,8,power_law_1.2,0.5300543785095215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,8,power_law_1.2,0.7299392223358154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,8,power_law_1.2,1.094809627532959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,8,power_law_1.2,1.372377586364746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,8,power_law_1.2,1.6301824569702148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,8,power_law_1.2,2.8358911514282226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,8,power_law_1.2,5.66572151184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,8,balanced,6.10321044921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,8,power_law_1.2,0.06442239880561829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,8,power_law_1.2,0.07619199752807618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,8,power_law_1.2,0.05511680245399475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,8,power_law_1.2,0.0644864022731781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,8,power_law_1.2,0.07203840017318726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,4,balanced,0.04841066896915436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,8,power_law_1.2,0.0762112021446228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,4,balanced,0.05563200016816457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,4,balanced,0.05041066805521647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,8,power_law_1.2,0.09386879801750184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,4,balanced,0.05707733333110809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,4,balanced,0.05264000097910563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,8,power_law_1.2,0.09749760031700135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,4,balanced,0.062122667829195656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,4,balanced,0.061706667145093284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,4,balanced,0.08066666622956593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,8,power_law_1.2,0.0985472023487091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,4,balanced,0.07407466570536296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,4,power_law_1.01,0.05885440111160278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,4,balanced,0.11358933647473653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,8,power_law_1.2,0.10314879417419434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,4,balanced,0.09737066427866618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,4,balanced,0.05805333455403646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,4,balanced,0.11566399534543355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,4,power_law_1.01,0.07470080256462097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,8,power_law_1.2,0.10711040496826171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,4,balanced,0.14537066221237183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,4,balanced,0.11588799953460693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,4,balanced,0.06197333335876465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,4,power_law_1.01,0.06314880251884461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,4,balanced,0.14693333705266318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,8,power_law_1.2,0.11278719902038574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,4,balanced,0.11705066760381062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,4,balanced,0.06571733454863231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,4,power_law_1.01,0.07094399929046631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,4,balanced,0.14594667156537375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,8,power_law_1.2,0.11978880167007447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,4,balanced,0.11761066317558289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,4,balanced,0.07646400233109792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,4,power_law_1.01,0.0813696026802063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,4,balanced,0.14668800433476767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,8,power_law_1.2,0.12929919958114625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,4,balanced,0.11932800213495891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,4,balanced,0.09526933232943217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,4,power_law_1.01,0.09938560128211975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,4,balanced,0.1486240029335022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,4,balanced,0.12204266587893169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,8,power_law_1.2,0.14445439577102662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,4,balanced,0.1304586629072825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,4,balanced,0.15110933780670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,4,power_law_1.01,0.11689599752426147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,4,balanced,0.1251306633154551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,8,power_law_1.2,0.15117440223693848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,4,balanced,0.1308746635913849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,4,balanced,0.1534773310025533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,4,power_law_1.01,0.1242624044418335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,4,balanced,0.12754666805267334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,4,balanced,0.13251200318336487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,8,power_law_1.2,0.17725440263748168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,4,power_law_1.01,0.1286080002784729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,4,balanced,0.15517333149909973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,4,balanced,0.13546133041381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,4,balanced,0.13539200027783713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,4,power_law_1.01,0.12900480031967163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,4,balanced,0.16146666804949442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,4,balanced,0.1365226705869039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,4,balanced,0.1371946632862091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,8,power_law_1.2,0.2062079906463623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,4,power_law_1.01,0.13848960399627686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,4,balanced,0.16682666540145874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,4,balanced,0.1397760013739268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,4,balanced,0.14672533671061197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,4,power_law_1.01,0.14406399726867675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,4,balanced,0.14482667048772177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,4,balanced,0.16906134287516275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,4,balanced,0.16887466112772623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,8,power_law_1.2,0.23255040645599365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,4,power_law_1.01,0.1460479974746704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,4,balanced,0.14872533082962036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,4,balanced,0.17529600858688354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,4,balanced,0.193231999874115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,4,balanced,0.15588800112406412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,4,power_law_1.01,0.17416319847106934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,8,power_law_1.2,0.3012991905212402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,4,balanced,0.19450666507085165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,4,balanced,0.16818133989969888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,4,balanced,0.22499199708302817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,8,power_law_1.2,0.37959039211273193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,4,power_law_1.01,0.18457599878311157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,4,balanced,0.17458132902781168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,4,balanced,0.21518399318059286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,8,power_law_1.2,0.5888639926910401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,4,power_law_1.01,0.19459840059280395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,4,balanced,0.25755733251571655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,4,balanced,0.18247467279434204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,8,power_law_1.2,0.7822527885437012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,4,balanced,0.2507359981536865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,4,power_law_1.01,1.3752960205078124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,8,power_law_1.2,0.9512831687927246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,4,power_law_1.01,1.4192704200744628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,4,balanced,0.3291253248850505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,4,balanced,0.2704373399416606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,8,power_law_1.2,1.3673088073730468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,4,power_law_1.01,1.452883243560791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,4,power_law_1.01,0.05169919729232788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,4,balanced,0.22032533089319864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,8,power_law_1.2,1.7713727951049805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,4,power_law_1.01,2.233196830749512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,4,balanced,0.33340267340342206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,4,power_law_1.01,0.061388802528381345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,4,balanced,0.4081919987996419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,4,power_law_1.01,0.31928319931030275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,4,power_law_1.01,0.05370879769325256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,8,power_law_1.2,2.6073408126831055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,4,power_law_1.01,0.3880896091461182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,4,power_law_1.01,0.062636798620224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,4,balanced,0.4036906560262044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,8,power_law_1.2,3.4277313232421873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,4,balanced,0.5737760066986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,4,power_law_1.01,0.5333759784698486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,4,power_law_1.01,0.07187839746475219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,8,power_law_1.2,4.95807991027832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,4,balanced,0.2824853261311849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,4,power_law_1.01,0.6749440193176269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,4,power_law_1.01,0.08264319896697998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,4,power_law_1.01,0.0955839991569519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,4,power_law_1.01,0.7902207851409913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,4,balanced,0.5484586556752523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,4,balanced,0.370527982711792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,8,power_law_1.2,10.712646484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,4,power_law_1.01,0.10481280088424683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,4,balanced,0.7438826560974121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,4,power_law_1.01,1.1401856422424317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,4,balanced,0.41577601432800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,4,power_law_1.01,0.10151040554046631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,4,power_law_1.01,1.5401535987854005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,4,power_law_1.01,0.10377600193023681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,4,power_law_1.01,1.8784320831298829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,4,balanced,0.5946293274561564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,4,balanced,0.6898187001546224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,4,power_law_1.01,0.10940159559249878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,4,power_law_1.01,0.11347839832305909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,4,power_law_1.01,2.818751907348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,4,balanced,0.7117013136545817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,4,balanced,1.0707039833068848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,4,power_law_1.01,0.11818239688873292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,4,power_law_1.01,5.696831893920899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,4,power_law_1.01,0.13140480518341063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,4,power_law_1.01,0.13882880210876464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,4,balanced,0.9853493372599283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,4,balanced,1.0881333351135254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,4,power_law_1.01,0.14856959581375123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,4,power_law_1.01,0.15370240211486816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,4,power_law_1.01,0.18856960535049438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,4,balanced,1.3320159912109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,4,balanced,1.3459839820861816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,4,power_law_1.01,0.2065216064453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,4,power_law_1.01,0.2529536008834839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,4,power_law_1.01,0.2990976095199585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,4,balanced,1.2133173147837322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,4,power_law_1.01,0.3836927890777588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,4,power_law_1.01,0.47574400901794434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,4,balanced,1.9823946952819824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,4,power_law_1.01,0.6673088073730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,4,power_law_1.01,0.8380096435546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,4,balanced,1.724954605102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,4,power_law_1.01,1.2292736053466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,4,power_law_1.01,0.06720640063285828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,4,power_law_1.01,1.4650560379028321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,4,power_law_1.01,0.07491199970245362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,4,power_law_1.01,1.922982406616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,4,power_law_1.01,0.06812800168991089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,4,balanced,1.5770400365193684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,4,balanced,2.608272075653076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,4,power_law_1.01,0.07797759771347046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,4,power_law_1.01,3.2576961517333984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,4,power_law_1.01,0.08702719807624817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,4,power_law_1.01,6.138111877441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,4,power_law_1.01,0.09923840165138245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,4,power_law_1.01,0.11568640470504761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,4,power_law_1.01,0.12124160528182984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,4,power_law_1.01,0.12392319440841675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,4,power_law_1.01,0.12830079793930055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,4,power_law_1.01,0.13649280071258546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,4,balanced,3.2361119588216147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,4,power_law_1.2,0.058847999572753905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,4,balanced,2.5777014096577964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,4,power_law_1.01,0.14531199932098388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,4,power_law_1.2,0.07475839853286743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,4,power_law_1.01,0.1519744038581848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,4,power_law_1.2,0.060249602794647215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,4,power_law_1.01,0.1696320056915283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,4,power_law_1.2,0.06938239932060242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,4,power_law_1.01,0.18387839794158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,4,power_law_1.2,0.07898880243301391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,4,balanced,2.333733399709066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,4,power_law_1.2,0.09412479996681214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,4,power_law_1.01,0.19483519792556764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,4,power_law_1.2,0.11466879844665527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,4,power_law_1.01,0.22958719730377197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,4,power_law_1.2,0.12416000366210937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,4,power_law_1.2,0.12458879947662353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,4,power_law_1.2,0.13159040212631226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,4,power_law_1.01,0.2846208095550537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,4,power_law_1.2,0.13829760551452636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,4,power_law_1.2,0.14732160568237304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,4,power_law_1.2,0.15406080484390258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,4,power_law_1.2,0.1725759983062744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,4,power_law_1.01,0.3372096061706543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,4,balanced,5.11683718363444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,4,power_law_1.2,0.1813055992126465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,4,power_law_1.01,0.4248960018157959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,4,power_law_1.2,0.18781440258026122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,4,power_law_1.2,1.3884032249450684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,4,power_law_1.01,0.5382207870483399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,4,power_law_1.2,1.4375871658325194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,4,power_law_1.01,0.7210815906524658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,4,power_law_1.2,1.9364992141723634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,4,power_law_1.01,0.9001472473144532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,4,power_law_1.2,2.0066560745239257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,4,power_law_1.01,1.3143551826477051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,4,power_law_1.2,0.32953600883483886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,4,power_law_1.01,1.633843231201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,4,power_law_1.2,0.401632022857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,4,power_law_1.01,2.4559232711791994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,4,power_law_1.2,0.5717887878417969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,4,power_law_1.01,3.30882568359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,4,power_law_1.2,0.7131711959838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,4,power_law_1.01,3.902048110961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,4,power_law_1.2,0.8601984024047852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,4,power_law_1.2,1.1931776046752929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,4,power_law_1.01,6.4178108215332035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,4,power_law_1.2,1.4959551811218261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,4,power_law_1.2,1.9060096740722656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,4,balanced,5.108415921529134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,4,power_law_1.01,13.236256408691407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,4,power_law_1.2,3.533651351928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,4,power_law_1.2,6.650323486328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,4,balanced,4.556069374084473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,4,balanced,10.1876589457194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,4,power_law_1.2,0.05134720206260681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,4,power_law_1.2,0.059564799070358276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,4,power_law_1.2,0.05326719880104065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,4,power_law_1.2,0.06116480231285095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,4,power_law_1.2,0.06949120163917541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,4,power_law_1.2,0.07822080254554749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,4,power_law_1.2,0.09662079811096191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,4,power_law_1.2,0.09776639938354492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,4,power_law_1.2,0.10093439817428589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,4,power_law_1.2,0.06718080043792725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,4,power_law_1.2,0.10368640422821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,4,power_law_1.2,0.07500799894332885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,4,power_law_1.2,0.11062400341033936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,4,power_law_1.2,0.06840959787368775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,4,power_law_1.2,0.11522560119628907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,4,power_law_1.2,0.07760639786720276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,4,power_law_1.2,0.12225279808044434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,4,power_law_1.2,0.08402559757232667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,4,power_law_1.2,0.13256959915161132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,4,power_law_1.2,0.09472000002861022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,4,power_law_1.2,0.14188159704208375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,4,power_law_1.2,0.11029119491577148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,4,power_law_1.2,0.15461119413375854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,4,power_law_1.2,0.11667200326919555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,4,power_law_1.2,0.16539520025253296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,4,power_law_1.2,0.1221119999885559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,4,power_law_1.2,0.1953727960586548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,4,power_law_1.2,0.12584960460662842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,4,power_law_1.2,0.2205631971359253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,4,power_law_1.2,0.13600000143051147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,4,power_law_1.2,0.2601344108581543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,4,power_law_1.2,0.14595839977264405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,4,power_law_1.2,0.3083008050918579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,4,power_law_1.2,0.15383679866790773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,4,power_law_1.2,0.38399999141693114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,4,power_law_1.2,0.17381759881973266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,2,balanced,0.05805333455403646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,4,power_law_1.2,0.5062848091125488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,4,power_law_1.2,0.18417919874191285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,2,balanced,0.059605335195859276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,4,power_law_1.2,0.6549568176269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,2,balanced,0.0757013310988744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,4,power_law_1.2,0.1966912031173706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,2,balanced,0.09303999940554301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,4,power_law_1.2,0.9319168090820312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,4,power_law_1.2,0.22750720977783204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,2,balanced,0.12339733044306438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,2,balanced,0.1755626598993937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,4,power_law_1.2,1.214367961883545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,2,balanced,0.1774133245150248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,2,balanced,0.16972267627716064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,4,power_law_1.2,0.29558401107788085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,4,power_law_1.2,1.6216384887695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,2,balanced,0.17101866006851196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,2,balanced,0.17136534055074057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,4,power_law_1.2,2.0899328231811523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,2,balanced,0.17522132396697998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,2,balanced,0.17851199706395468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,4,power_law_1.2,0.3339967966079712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,4,power_law_1.2,3.2253887176513674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,2,balanced,0.18056533734003702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,2,balanced,0.18526933590571085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,4,power_law_1.2,0.44040961265563966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,2,balanced,0.19353600343068442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,4,power_law_1.2,6.995327758789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,4,power_law_1.2,0.5485888004302979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,2,balanced,0.19867199659347534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,4,power_law_1.2,0.7762879848480224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,2,balanced,0.20645334323247275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,4,power_law_1.2,1.0125951766967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,2,balanced,0.23584532737731934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,2,balanced,0.2829599976539612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,4,power_law_1.2,1.3177151679992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,2,balanced,0.319157342116038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,4,power_law_1.2,1.8708288192749023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,2,balanced,0.37284799416859943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,4,power_law_1.2,3.0354496002197267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,2,balanced,0.47916801770528156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,4,power_law_1.2,3.611449432373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,4,power_law_1.2,4.5703166961669925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,2,balanced,0.6131146748860677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,4,power_law_1.2,7.486316680908203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,2,balanced,0.8690933386484782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,4,power_law_1.2,14.388978576660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,2,balanced,1.1183946927388508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,2,balanced,1.645125389099121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,2,balanced,0.0517439991235733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,2,power_law_1.01,0.05803520083427429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,2,balanced,0.05433600147565206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,2,balanced,0.06355733176072438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,2,power_law_1.01,0.06269440054893494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,2,balanced,0.0775679995616277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,2,balanced,0.10699733098347981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,2,power_law_1.01,0.06407039761543273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,2,balanced,0.15178666512171426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,2,power_law_1.01,0.08805760145187377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,2,balanced,1.9279786745707195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,2,power_law_1.01,0.05162879824638367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,2,balanced,0.1548746625582377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,2,power_law_1.01,0.10720640420913696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,2,balanced,0.1549066702524821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,2,power_law_1.01,0.06381440162658691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,2,balanced,0.1585599978764852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,2,power_law_1.01,0.11863679885864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,2,power_law_1.01,0.056883198022842404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,2,balanced,0.1586026648680369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,2,power_law_1.01,0.14388480186462402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,2,power_law_1.01,0.07289599776268005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,2,balanced,0.16262400150299072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,2,power_law_1.01,0.14740480184555055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,2,power_law_1.01,0.0898688018321991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,2,balanced,0.1655893325805664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,2,power_law_1.01,0.14942079782485962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,2,power_law_1.01,0.10191999673843384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,2,balanced,0.16915732622146606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,2,power_law_1.01,0.15222400426864624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,2,power_law_1.01,0.12154239416122437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,2,balanced,0.17163733641306558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,2,balanced,2.604314645131429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,2,power_law_1.01,0.1618239998817444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,2,power_law_1.01,0.12936960458755492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,2,balanced,0.18027200301488241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,2,power_law_1.01,0.17126400470733644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,2,power_law_1.01,0.13063679933547973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,2,balanced,0.18542399009068808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,2,power_law_1.01,0.1382464051246643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,2,power_law_1.01,0.17221120595932007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,2,balanced,0.1989120046297709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,2,power_law_1.01,0.1441856026649475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,2,power_law_1.01,0.1835584044456482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,2,balanced,0.23442665735880533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,2,power_law_1.01,0.15434880256652833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,2,power_law_1.01,0.44012160301208497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,2,power_law_1.01,0.1624511957168579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,2,balanced,0.27291200558344525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,2,power_law_1.01,1.178873634338379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,2,power_law_1.01,0.17152639627456664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,2,power_law_1.01,1.451871967315674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,2,balanced,0.3156053423881531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,2,power_law_1.01,0.18988800048828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,2,power_law_1.01,1.4887231826782226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,2,power_law_1.01,0.2024064064025879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,2,balanced,0.3603146473566691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,2,power_law_1.01,1.511520004272461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,2,power_law_1.01,0.21768319606781006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,2,power_law_1.01,0.26138880252838137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,2,power_law_1.01,2.809926414489746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,2,balanced,0.472922682762146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,2,power_law_1.01,0.28933119773864746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,2,power_law_1.01,0.4085375785827637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,2,balanced,3.745903968811035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,2,power_law_1.01,0.34612479209899905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,2,power_law_1.01,0.5560128211975097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,2,balanced,0.6081120173136393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,2,power_law_1.01,0.42677760124206543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,2,power_law_1.01,0.6691775798797608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,2,power_law_1.01,0.5356160163879394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,2,power_law_1.01,0.9117952346801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,2,power_law_1.01,0.6757696151733399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,2,power_law_1.01,1.1600255966186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,2,balanced,0.8749173482259115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,2,power_law_1.01,0.9290111541748047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,2,power_law_1.01,1.155833625793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,2,power_law_1.01,1.7517824172973633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,2,power_law_1.01,1.7124736785888672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,2,power_law_1.01,2.2895999908447267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,2,power_law_1.01,2.296735954284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,2,power_law_1.01,2.653273582458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,2,balanced,1.1470879713694255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,2,power_law_1.01,2.699193572998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,2,power_law_1.01,4.453593444824219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,2,power_law_1.01,4.268544006347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,2,power_law_1.01,8.821932983398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,2,power_law_1.01,9.105017852783202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,2,balanced,1.6925493876139324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,2,balanced,2.0650026003519693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,2,balanced,7.395194371541341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,2,power_law_1.2,0.05848960280418396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,2,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,2,power_law_1.2,0.06607999801635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,2,balanced,2.7347520192464194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,2,power_law_1.2,0.08244479894638061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,2,power_law_1.2,0.09850239753723145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,2,power_law_1.2,0.11290240287780762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,2,power_law_1.2,0.1391808032989502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,2,power_law_1.2,0.05173119902610779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,2,power_law_1.2,0.14513280391693115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,2,power_law_1.2,0.061536002159118655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,2,power_law_1.2,0.14920320510864257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,2,power_law_1.2,0.05794559717178345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,2,power_law_1.2,0.15708800554275512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,2,power_law_1.2,0.06963840126991272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,2,power_law_1.2,0.0847487986087799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,2,power_law_1.2,0.16779520511627197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,2,power_law_1.2,0.09567360281944275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,2,power_law_1.2,0.1710528016090393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,2,power_law_1.2,0.11878399848937989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,2,power_law_1.2,0.1735551953315735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,2,balanced,4.0597225824991865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,2,power_law_1.2,0.135206401348114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,2,power_law_1.2,0.4300864219665527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,2,power_law_1.2,0.12792960405349732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,2,power_law_1.2,1.4086463928222657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,2,power_law_1.2,0.1375040054321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,2,power_law_1.2,1.4276479721069335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,2,power_law_1.2,0.148198401927948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,2,power_law_1.2,1.4568384170532227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,2,power_law_1.2,0.1534335970878601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,2,power_law_1.2,1.5041152000427247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,2,power_law_1.2,0.16286079883575438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,2,power_law_1.2,1.5321151733398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,2,power_law_1.2,0.1815551996231079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,2,power_law_1.2,0.19526400566101074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,2,power_law_1.2,2.5523199081420898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,2,power_law_1.2,0.21079039573669434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,2,power_law_1.2,0.4288383960723877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,2,power_law_1.2,0.22457599639892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,2,power_law_1.2,0.57608962059021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,2,power_law_1.2,0.2760447978973389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,2,power_law_1.2,0.6956607818603515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,2,power_law_1.2,0.3036736011505127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,2,power_law_1.2,0.9904064178466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,2,power_law_1.2,0.36745600700378417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,2,power_law_1.2,1.2127360343933105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,2,power_law_1.2,0.4301631927490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,2,power_law_1.2,1.7425151824951173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,2,power_law_1.2,0.5498623847961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,2,power_law_1.2,2.2638271331787108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,2,power_law_1.2,0.6918975830078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,2,power_law_1.2,0.9616640090942383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,2,power_law_1.2,2.7715328216552733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,2,power_law_1.2,1.2406720161437987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,2,power_law_1.2,4.518841552734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,2,power_law_1.2,1.7678016662597655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,2,power_law_1.2,2.3842239379882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,2,power_law_1.2,8.903558349609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,2,power_law_1.2,2.8463359832763673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,2,balanced,8.035770416259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,2,power_law_1.2,4.572153472900391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,2,power_law_1.2,9.992205047607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,64,balanced,0.024400000770886738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,64,balanced,0.026874666412671406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,64,balanced,0.027615999182065327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,64,balanced,0.02874133239189784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,64,balanced,0.029850666721661884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,64,balanced,0.02826666583617528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,64,balanced,0.028223998844623566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,64,balanced,0.028394666810830433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,64,balanced,0.028143999477227528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,64,balanced,0.02871999889612198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,64,balanced,0.029669334491093952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,64,balanced,0.02940800040960312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,64,balanced,0.03017599880695343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,64,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,64,balanced,0.03606399893760681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,64,balanced,0.029701332251230877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,64,balanced,0.037503999968369804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,64,balanced,0.030837332208951313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,64,balanced,0.038165333370367684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,64,balanced,0.032042667269706726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,64,balanced,0.03939733405907949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,64,balanced,0.03332266708215078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,64,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,64,balanced,0.033573334415753685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,64,balanced,0.033861334125200905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,64,balanced,0.04042666653792063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,64,balanced,0.022869333624839783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,64,balanced,0.033626665671666466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,64,balanced,0.046906664967536926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,64,balanced,0.03375466664632162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,64,balanced,0.022869333624839783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,64,balanced,0.023103999594847362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,64,balanced,0.034490667283535004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,64,balanced,0.02447466552257538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,64,balanced,0.034832000732421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,64,balanced,0.04540266593297323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,64,balanced,0.025568000972270966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,64,power_law_1.01,0.02479359954595566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,64,balanced,0.035205334424972534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,64,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,64,power_law_1.01,0.02834559977054596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,64,balanced,0.035829332967599235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,64,balanced,0.026799999177455902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,64,balanced,0.05299200117588043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,64,power_law_1.01,0.02810879945755005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,64,balanced,0.026901334524154663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,64,balanced,0.03700266778469086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,64,power_law_1.01,0.028678399324417115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,64,balanced,0.026922665536403656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,64,power_law_1.01,0.02911359965801239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,64,balanced,0.039306665460268654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,64,balanced,0.053488001227378845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,64,power_law_1.01,0.027423998713493346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,64,balanced,0.02757866680622101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,64,balanced,0.038917332887649536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,64,power_law_1.01,0.027456000447273254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,64,balanced,0.02784000088771184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,64,power_law_1.01,0.027744001150131224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,64,balanced,0.039349332451820374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,64,balanced,0.02794133375088374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,64,power_law_1.01,0.031200000643730165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,64,power_law_1.01,0.03208320140838623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,64,balanced,0.06442666550477345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,64,balanced,0.028789333999156952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,64,balanced,0.04089066634575526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,64,power_law_1.01,0.03392640054225922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,64,balanced,0.029258665939172108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,64,power_law_1.01,0.034143999218940735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,64,balanced,0.04244266450405121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,64,power_law_1.01,0.034796801209449765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,64,balanced,0.03179199993610382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,64,power_law_1.01,0.03901439905166626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,64,balanced,0.045125335454940796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,64,balanced,0.031013332307338715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,64,power_law_1.01,0.04444800019264221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,64,balanced,0.06866133213043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,64,power_law_1.01,0.04907520115375519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,64,power_law_1.01,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,64,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,64,power_law_1.01,0.061427199840545656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,64,power_law_1.01,0.06567040085792542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,64,power_law_1.01,0.08008319735527039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,64,balanced,0.06301866471767426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,64,balanced,0.03259200106064478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,64,power_law_1.01,0.07651839852333069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,64,power_law_1.01,0.09581440091133117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,64,balanced,0.03465066601832708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,64,power_law_1.01,0.09845119714736938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,64,balanced,0.0942133367061615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,64,balanced,0.06945066650708516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,64,power_law_1.01,0.12400640249252319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,64,balanced,0.03409600009520849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,64,power_law_1.01,0.15953279733657838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,64,power_law_1.01,0.24160640239715575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,64,power_law_1.01,0.2835903882980347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,64,balanced,0.08937600255012512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,64,power_law_1.01,0.3878400087356567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,64,power_law_1.01,0.6150015830993653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,64,balanced,0.03931200007597605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,64,power_law_1.01,1.1706687927246093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,64,balanced,0.10074667135874431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,64,balanced,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,64,balanced,0.10407466689745586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,64,balanced,0.04891733328501383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,64,balanced,0.13717866937319437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,64,balanced,0.0532533327738444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,64,balanced,0.1151626706123352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,64,balanced,0.16405333081881204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,64,balanced,0.07150400181611379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,64,balanced,0.16010133425394693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,64,balanced,0.19221866130828857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,64,balanced,0.08463999629020691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,64,power_law_1.2,0.02545279860496521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,64,power_law_1.01,0.03415040075778961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,64,power_law_1.2,0.027372801303863527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,64,power_law_1.01,0.03204480111598969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,64,power_law_1.2,0.026732799410820008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,64,power_law_1.01,0.030559998750686646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,64,power_law_1.01,0.023027199506759643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,64,power_law_1.2,0.02858240008354187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,64,power_law_1.01,0.032204800844192506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,64,power_law_1.01,0.032518398761749265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,64,power_law_1.2,0.029311999678611755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,64,power_law_1.01,0.023219199478626253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,64,balanced,0.1162453293800354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,64,power_law_1.01,0.03293440043926239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,64,power_law_1.2,0.02746239900588989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,64,power_law_1.01,0.02279680073261261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,64,power_law_1.01,0.03338879942893982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,64,power_law_1.2,0.027558401226997375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,64,power_law_1.01,0.024876800179481507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,64,power_law_1.01,0.03369599878787995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,64,power_law_1.2,0.02871679961681366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,64,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,64,power_law_1.01,0.034176000952720643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,64,power_law_1.2,0.03301759958267212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,64,power_law_1.01,0.026495999097824095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,64,power_law_1.2,0.033542400598526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,64,power_law_1.01,0.034835198521614076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,64,power_law_1.01,0.02690559923648834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,64,power_law_1.2,0.03395200073719025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,64,power_law_1.01,0.03555200099945068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,64,power_law_1.2,0.034790399670600894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,64,power_law_1.01,0.02696320116519928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,64,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,64,balanced,0.1425493359565735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,64,balanced,0.2835093339284261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,64,power_law_1.2,0.03506560027599335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,64,power_law_1.01,0.026950401067733765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,64,power_law_1.01,0.03666560053825378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,64,power_law_1.2,0.04154239892959595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,64,power_law_1.01,0.02710399925708771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,64,power_law_1.01,0.03783040046691895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,64,power_law_1.2,0.034892800450325015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,64,power_law_1.01,0.04002560079097748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,64,power_law_1.2,0.04364160001277924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,64,power_law_1.01,0.027923199534416198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,64,power_law_1.2,0.031001600623130798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,64,power_law_1.01,0.040268799662590025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,64,power_law_1.2,0.047968000173568726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,64,power_law_1.01,0.02869119942188263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,64,power_law_1.2,0.03028480112552643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,64,power_law_1.01,0.04382080137729645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,64,power_law_1.2,0.05617280006408691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,64,power_law_1.01,0.029267200827598573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,64,power_law_1.2,0.032467201352119446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,64,power_law_1.01,0.05110399723052979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,64,power_law_1.2,0.06696320176124573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,64,power_law_1.01,0.030137598514556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,64,power_law_1.2,0.032364800572395325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,64,power_law_1.01,0.05459840297698974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,64,power_law_1.2,0.0757695972919464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,64,power_law_1.01,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,64,power_law_1.2,0.033292800188064575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,64,power_law_1.01,0.06794880032539367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,64,power_law_1.2,0.11271040439605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,64,power_law_1.01,0.03758080005645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,64,power_law_1.2,0.0333759993314743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,64,power_law_1.01,0.07368959784507752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,64,power_law_1.2,0.09201920032501221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,64,power_law_1.2,0.03361279964447021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,64,power_law_1.01,0.0971455991268158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,64,power_law_1.2,0.13107839822769166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,64,balanced,0.28062933683395386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,64,power_law_1.01,0.04323840141296387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,64,power_law_1.2,0.03403519988059998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,64,power_law_1.01,0.10859520435333252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,64,power_law_1.2,0.13129600286483764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,64,power_law_1.01,0.05644800066947937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,64,power_law_1.2,0.03421440124511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,64,power_law_1.01,0.13980799913406372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,64,power_law_1.2,0.1819391965866089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,64,balanced,0.17018133401870728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,64,power_law_1.01,0.0606719970703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,64,power_law_1.2,0.035488000512123107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,64,power_law_1.01,0.18042240142822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,64,power_law_1.2,0.25922560691833496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,64,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,64,power_law_1.01,0.271891188621521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,64,power_law_1.2,0.37058560848236083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,64,power_law_1.2,0.036575999855995175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,64,power_law_1.01,0.06677119731903076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,64,power_law_1.01,0.3452928066253662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,64,power_law_1.2,0.4601088047027588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,64,power_law_1.2,0.03761920034885406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,64,power_law_1.01,0.08744959831237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,64,power_law_1.01,0.4610879898071289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,64,power_law_1.2,0.04040960073471069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,64,power_law_1.2,0.5497727870941163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,64,power_law_1.01,0.5814527988433837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,64,power_law_1.2,0.04215039908885956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,64,power_law_1.2,1.05413761138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,64,power_law_1.01,0.10306559801101685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,64,power_law_1.2,0.04769279956817627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,64,power_law_1.01,1.3285311698913573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,64,power_law_1.2,2.3628671646118162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,64,power_law_1.01,0.12573440074920655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,64,power_law_1.2,0.05498239994049072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,64,power_law_1.2,0.05759360194206238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,64,power_law_1.01,0.19010560512542723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,64,power_law_1.2,0.07431679964065552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,64,balanced,0.5221226612726847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,64,power_law_1.2,0.08184319734573364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,64,balanced,0.25380800167719525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,64,power_law_1.01,0.23637120723724364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,64,power_law_1.2,0.12353279590606689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,64,power_law_1.01,0.37731199264526366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,64,power_law_1.2,0.13693439960479736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,64,power_law_1.01,0.47720961570739745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,64,power_law_1.2,0.2045759916305542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,64,power_law_1.2,0.24645121097564698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,64,power_law_1.2,0.35966079235076903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,64,power_law_1.01,0.5100287914276123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,64,power_law_1.2,0.46375041007995604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,64,power_law_1.01,0.9115584373474122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,64,power_law_1.2,0.6125184059143066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,64,power_law_1.01,1.9492992401123046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,64,power_law_1.2,1.10314884185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,64,power_law_1.2,0.022886399924755097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,64,power_law_1.2,2.3764671325683593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,64,power_law_1.2,0.022540800273418427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,64,power_law_1.2,0.02279040068387985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,64,power_law_1.2,0.024799999594688416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,64,power_law_1.2,0.02542720139026642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,64,power_law_1.2,0.02625280022621155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,64,power_law_1.2,0.026918399333953857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,64,power_law_1.2,0.02705279886722565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,64,power_law_1.2,0.027244800329208375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,64,power_law_1.2,0.02746239900588989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,64,power_law_1.2,0.028064000606536865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,64,power_law_1.2,0.028857600688934327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,64,power_law_1.2,0.029241600632667543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,64,power_law_1.2,0.03260799944400787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,64,power_law_1.2,0.03815680146217346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,64,power_law_1.2,0.039699199795722964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,64,balanced,0.506767988204956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,64,power_law_1.2,0.049619200825691226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,64,power_law_1.2,0.058899199962615965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,64,power_law_1.2,0.07400320172309875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,64,power_law_1.2,0.09365119934082031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,64,power_law_1.2,0.11083519458770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,64,power_law_1.2,0.13265279531478882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,64,power_law_1.2,0.17788159847259521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,64,power_law_1.2,0.28873600959777834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,64,power_law_1.2,0.4010176181793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,64,power_law_1.2,0.5460288047790527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,64,power_law_1.2,0.844422435760498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,64,power_law_1.2,1.0723711967468261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,64,power_law_1.2,1.6962303161621093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,64,power_law_1.2,3.5436416625976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,32,balanced,0.025733334322770435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,32,balanced,0.022810667753219604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,32,balanced,0.02274666726589203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,32,balanced,0.02404800057411194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,32,balanced,0.02513066679239273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,32,balanced,0.02645866572856903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,32,balanced,0.0269813338915507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,32,balanced,0.027098665634791057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,32,balanced,0.026528000831604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,32,balanced,0.027237333357334137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,32,balanced,0.027749332288901012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,32,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,32,balanced,0.028607999285062153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,32,balanced,0.03469333300987879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,32,balanced,0.03661333272854487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,32,balanced,0.03633599976698557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,32,balanced,0.03048533449570338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,32,balanced,0.03827200084924698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,32,balanced,0.028965334097544353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,32,balanced,0.039813332259655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,32,balanced,0.029146666328112285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,32,balanced,0.03149333347876867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,32,power_law_1.01,0.026291200518608095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,32,balanced,0.04182933270931244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,32,balanced,0.0330826664964358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,32,power_law_1.01,0.02290560007095337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,32,balanced,0.03366933266321818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,32,balanced,0.04728533327579498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,32,power_law_1.01,0.022169600427150726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,32,balanced,0.03355200091997782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,32,power_law_1.01,0.0236735999584198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,32,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,32,balanced,0.045456002155939736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,32,power_law_1.01,0.024588799476623534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,32,power_law_1.01,0.035820800065994265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,32,balanced,0.03450666616360346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,32,power_law_1.01,0.025862398743629455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,32,power_law_1.01,0.030963200330734252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,32,balanced,0.034245334565639496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,32,balanced,0.05600533386071523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,32,balanced,0.022815999885400135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,32,power_law_1.01,0.026035198569297792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,32,power_law_1.01,0.02967039942741394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,32,balanced,0.03484266748030981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,32,balanced,0.023029332359631855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,32,power_law_1.01,0.028966400027275085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,32,power_law_1.01,0.03187200129032135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,32,balanced,0.03480000048875809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,32,balanced,0.023007998863856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,32,power_law_1.01,0.03121280074119568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,32,balanced,0.05676800012588501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,32,power_law_1.01,0.031711998581886294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,32,balanced,0.03562666724125544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,32,balanced,0.02479466547568639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,32,power_law_1.01,0.030451199412345885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,32,power_law_1.01,0.03304319977760315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,32,balanced,0.03668266783157984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,32,balanced,0.026186667382717133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,32,power_law_1.01,0.032595199346542356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,32,power_law_1.01,0.03320319950580597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,32,balanced,0.02714666724205017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,32,balanced,0.03892799963553747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,32,balanced,0.07011199990908305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,32,power_law_1.01,0.03330560028553009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,32,power_law_1.01,0.03351680040359497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,32,balanced,0.027104000250498455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,32,balanced,0.03842666745185852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,32,power_law_1.01,0.03345920145511627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,32,power_law_1.01,0.033766400814056394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,32,power_law_1.01,0.023660799860954283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,32,balanced,0.027258666853109997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,32,balanced,0.03972266614437103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,32,power_law_1.01,0.03397760093212128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,32,power_law_1.01,0.036601600050926206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,32,balanced,0.027450665831565857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,32,power_law_1.01,0.022950400412082673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,32,power_law_1.01,0.03491199910640717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,32,balanced,0.04135466615358988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,32,power_law_1.01,0.02290560007095337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,32,power_law_1.01,0.03898879885673523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,32,balanced,0.028037334481875103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,32,balanced,0.0777706652879715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,32,power_law_1.01,0.024908800423145295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,32,power_law_1.01,0.03607040047645569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,32,balanced,0.028223998844623566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,32,power_law_1.01,0.040249601006507874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,32,balanced,0.042319998145103455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,32,power_law_1.01,0.02568320035934448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,32,power_law_1.01,0.03703039884567261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,32,power_law_1.01,0.026713600754737853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,32,balanced,0.028522667785485584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,32,power_law_1.01,0.04352000057697296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,32,power_law_1.01,0.027167999744415285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,32,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,32,power_law_1.01,0.03849599957466125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,32,balanced,0.029002666473388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,32,power_law_1.01,0.050419199466705325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,32,power_law_1.01,0.02717440128326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,32,power_law_1.01,0.040761598944664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,32,balanced,0.02956799914439519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,32,power_law_1.01,0.027456000447273254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,32,power_law_1.01,0.061312001943588254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,32,balanced,0.049728001157442726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,32,power_law_1.01,0.02807680070400238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,32,power_law_1.01,0.04325119853019714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,32,balanced,0.033439998825391136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,32,power_law_1.01,0.07181439995765686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,32,power_law_1.01,0.02898559868335724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,32,balanced,0.10609066486358643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,32,power_law_1.01,0.04309119880199432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,32,power_law_1.01,0.030316799879074097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,32,power_law_1.01,0.06719359755516052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,32,balanced,0.03236266722281774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,32,balanced,0.06529599924882253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,32,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,32,power_law_1.01,0.047443199157714847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,32,power_law_1.01,0.08618879914283753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,32,power_law_1.01,0.03407999873161316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,32,power_law_1.01,0.055078399181365964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,32,power_law_1.01,0.09530240297317505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,32,power_law_1.01,0.035692799091339114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,32,power_law_1.01,0.0382207989692688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,32,power_law_1.01,0.07171840071678162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,32,balanced,0.07381333410739899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,32,power_law_1.2,0.026630398631095887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,32,power_law_1.01,0.13036799430847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,32,power_law_1.01,0.06968960165977478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,32,balanced,0.03378133227427801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,32,power_law_1.01,0.1471743941307068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,32,power_law_1.2,0.021881599724292756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,32,power_law_1.01,0.09015039801597595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,32,power_law_1.01,0.04247680008411407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,32,power_law_1.01,0.2031872034072876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,32,power_law_1.2,0.02205439954996109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,32,balanced,0.03602666656176249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,32,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,32,power_law_1.01,0.10652799606323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,32,balanced,0.09571199615796407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,32,balanced,0.11538666486740112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,32,power_law_1.01,0.061868798732757566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,32,power_law_1.2,0.023507200181484222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,32,power_law_1.01,0.2755392074584961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,32,balanced,0.03618666778008143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,32,power_law_1.01,0.14109439849853517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,32,power_law_1.2,0.024447999894618988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,32,power_law_1.01,0.3071104049682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,32,power_law_1.01,0.1699455976486206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,32,power_law_1.2,0.025868800282478333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,32,power_law_1.01,0.267903995513916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,32,power_law_1.01,0.46654720306396485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,32,power_law_1.2,0.026067200303077697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,32,balanced,0.10945066809654236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,32,power_law_1.01,0.06659200191497802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,32,balanced,0.04219200213750204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,32,power_law_1.01,0.3180223941802979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,32,power_law_1.2,0.029126399755477907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,32,power_law_1.01,0.0870848000049591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,32,power_law_1.01,1.1542271614074706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,32,power_law_1.2,0.03118079900741577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,32,power_law_1.01,0.4148287773132324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,32,balanced,0.04533333579699198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,32,power_law_1.2,0.03166080117225647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,32,power_law_1.01,0.6400576114654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,32,power_law_1.01,0.10391039848327636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,32,power_law_1.2,0.03252480030059814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,32,power_law_1.01,0.13564800024032592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,32,balanced,0.13225066661834717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,32,power_law_1.2,0.03397760093212128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,32,power_law_1.01,1.3680959701538087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,32,balanced,0.056426664193471275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,32,balanced,0.15042133132616678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,32,power_law_1.2,0.03383040130138397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,32,power_law_1.2,0.03638400137424469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,32,balanced,0.06291733185450236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,32,power_law_1.2,0.039103999733924866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,32,power_law_1.01,0.16244479417800903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,32,power_law_1.2,0.03971199989318848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,32,power_law_1.2,0.04971520006656647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,32,power_law_1.2,0.05375360250473023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,32,power_law_1.01,0.2171583890914917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,32,balanced,0.18129066626230875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,32,balanced,0.08518399794896443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,32,power_law_1.2,0.06451839804649354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,32,power_law_1.01,0.4229695796966553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,32,power_law_1.2,0.036313599348068236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,32,power_law_1.2,0.0770367980003357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,32,power_law_1.01,0.5014016151428222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,32,power_law_1.2,0.07804160118103028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,32,power_law_1.01,0.7364480018615722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,32,power_law_1.2,0.030067199468612672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,32,power_law_1.2,0.029600000381469725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,32,power_law_1.2,0.10314240455627441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,32,power_law_1.01,0.958732795715332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,32,power_law_1.2,0.03155199885368347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,32,power_law_1.2,0.10577919483184814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,32,balanced,0.1941866676012675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,32,balanced,0.10086400310198466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,32,power_law_1.01,1.872800064086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,32,power_law_1.2,0.03182080090045929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,32,power_law_1.2,0.16844160556793214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,32,power_law_1.2,0.033062401413917544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,32,power_law_1.2,0.2361920118331909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,32,power_law_1.2,0.03326080143451691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,32,power_law_1.2,0.2962048053741455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,32,balanced,0.21598400672276816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,32,power_law_1.2,0.033542400598526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,32,power_law_1.2,0.36417279243469236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,32,power_law_1.2,0.03372800052165985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,32,power_law_1.2,0.6534783840179443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,32,power_law_1.2,0.034169599413871765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,32,balanced,0.14109866817792258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,32,power_law_1.2,0.03557760119438171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,32,power_law_1.2,0.7200831890106201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,32,power_law_1.2,0.036499199271202085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,32,power_law_1.2,2.2267583847045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,32,power_law_1.2,0.03722879886627197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,32,power_law_1.2,0.03797119855880737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,32,power_law_1.2,0.04230400025844574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,32,power_law_1.2,0.04402559995651245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,32,balanced,0.17654933532079062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,32,power_law_1.2,0.04501760005950928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,32,power_law_1.2,0.05504639744758606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,32,balanced,0.32201067606608075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,32,power_law_1.2,0.06038399934768677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,32,power_law_1.2,0.07745919823646545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,32,power_law_1.2,0.07900159955024719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,32,power_law_1.2,0.10703359842300415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,32,power_law_1.2,0.13320319652557372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,32,balanced,0.2143253286679586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,32,power_law_1.2,0.1801344037055969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,32,power_law_1.2,0.2339008092880249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,32,balanced,0.3461493253707886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,32,power_law_1.2,0.34968318939208987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,32,power_law_1.2,0.4819200038909912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,32,power_law_1.2,0.47675518989562987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,32,power_law_1.2,1.1065792083740233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,32,power_law_1.2,2.5038015365600588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,32,balanced,0.3450133403142293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,32,balanced,0.6029280026753744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,32,balanced,0.6650453408559164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,16,balanced,0.022463999688625336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,16,balanced,0.022181332111358643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,16,balanced,0.022218666970729828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,32,power_law_1.2,0.023795199394226075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,16,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,32,power_law_1.2,0.022617599368095397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,32,power_law_1.2,0.02309119999408722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,16,balanced,0.025616000096003216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,32,power_law_1.2,0.025177600979804992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,16,balanced,0.02699200063943863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,32,power_law_1.2,0.02573440074920654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,32,power_law_1.2,0.026969599723815917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,16,balanced,0.027093333502610523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,32,power_law_1.2,0.027193599939346315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,16,balanced,0.027269333600997925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,32,power_law_1.2,0.027449598908424376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,16,balanced,0.026917333404223125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,32,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,16,balanced,0.027514666318893433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,32,power_law_1.2,0.027878400683403016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,32,power_law_1.2,0.029203200340270997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,16,balanced,0.027866666515668232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,32,power_law_1.2,0.030131199955940248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,16,balanced,0.028389332195123036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,32,power_law_1.2,0.03118079900741577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,16,balanced,0.028783999383449554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,32,power_law_1.2,0.03363839983940124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,32,power_law_1.2,0.03641600012779236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,16,balanced,0.03001066545645396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,16,balanced,0.02976000060637792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,32,power_law_1.2,0.0434112012386322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,16,balanced,0.03512533257404963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,16,balanced,0.029178666571776073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,16,balanced,0.035173334181308746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,16,balanced,0.029663999875386555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,32,power_law_1.2,0.04775680005550385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,16,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,16,balanced,0.037989333271980286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,32,power_law_1.2,0.05687040090560913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,16,balanced,0.03365866591533025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,32,power_law_1.2,0.06780800223350525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,16,balanced,0.040261333187421165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,16,balanced,0.034448000291983284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,16,balanced,0.04262933135032654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,16,balanced,0.034314667185147606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,32,power_law_1.2,0.07800959944725036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,16,balanced,0.03481066723664602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,32,power_law_1.2,0.10640000104904175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,16,balanced,0.04480533301830292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,16,balanced,0.03497066597143809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,16,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,32,power_law_1.2,0.12380160093307495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,16,balanced,0.03545066714286804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,16,balanced,0.049173335234324135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,16,balanced,0.03542399903138479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,32,power_law_1.2,0.1518399953842163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,16,balanced,0.036271999279658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,16,balanced,0.037471999724706016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,16,balanced,0.06070933242638906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,16,balanced,0.02345066765944163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,32,power_law_1.2,0.28739840984344484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,16,balanced,0.0395413339138031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,16,balanced,0.023423999547958374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,16,balanced,0.03899200012286504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,32,power_law_1.2,0.27959039211273196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,16,balanced,0.023978665471076965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,16,balanced,0.06274133423964183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,16,balanced,0.04050666590531667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,32,power_law_1.2,0.5710015773773194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,16,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,32,power_law_1.2,0.767622423171997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,16,balanced,0.02736533433198929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,16,balanced,0.04414399961630503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,32,power_law_1.2,1.1880191802978515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,16,balanced,0.02829333394765854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,16,balanced,0.04515733321507772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,32,power_law_1.2,1.8704767227172852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,16,balanced,0.028064000109831493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,16,balanced,0.08193600177764893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,16,balanced,0.02828799933195114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,16,balanced,0.050106664498647056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,32,power_law_1.2,3.915475082397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,16,balanced,0.028304000695546467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,16,power_law_1.01,0.025196799635887147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,16,balanced,0.02906133234500885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,16,balanced,0.055344000458717346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,16,balanced,0.029152000943819683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,16,power_law_1.01,0.022387200593948366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,16,balanced,0.03033066789309184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,16,balanced,0.08680533369382222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,16,power_law_1.01,0.021510399878025055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,16,balanced,0.07251733541488647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,16,balanced,0.030741333961486816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,16,power_law_1.01,0.023449599742889404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,16,balanced,0.031173333525657654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,16,power_law_1.01,0.024160000681877136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,16,power_law_1.01,0.026041600108146667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,16,balanced,0.0813920001188914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,16,power_law_1.01,0.02622720003128052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,16,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,16,power_law_1.01,0.036582401394844054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,16,power_law_1.01,0.026649600267410277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,16,balanced,0.03433600068092346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,16,balanced,0.12225066622098286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,16,power_law_1.01,0.029926401376724244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,16,power_law_1.01,0.030995199084281923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,16,balanced,0.10916800300280254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,16,power_law_1.01,0.02958720028400421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,16,power_law_1.01,0.030931198596954347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,16,power_law_1.01,0.03260799944400787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,16,power_law_1.01,0.03278720080852508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,16,power_law_1.01,0.03216640055179596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,16,power_law_1.01,0.033292800188064575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,16,balanced,0.03619199991226196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,16,power_law_1.01,0.03384959995746613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,16,power_law_1.01,0.033344000577926636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,16,balanced,0.1269706686337789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,16,balanced,0.04013866682847341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,16,power_law_1.01,0.040300801396369934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,16,power_law_1.01,0.03378559947013855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,16,balanced,0.04068800061941147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,16,power_law_1.01,0.042419201135635375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,16,power_law_1.01,0.03418239951133728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,16,balanced,0.14414933323860168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,16,power_law_1.01,0.04428800046443939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,16,power_law_1.01,0.03452799916267395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,16,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,16,power_law_1.01,0.03598720133304596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,16,power_law_1.01,0.05123199820518494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,16,balanced,0.04958933095137278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,16,power_law_1.01,0.03712640106678009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,16,balanced,0.17737066745758057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,16,power_law_1.01,0.04971520006656647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,16,power_law_1.01,0.0367680013179779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,16,balanced,0.054661333560943604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,16,power_law_1.01,0.06423680186271667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,16,power_law_1.01,0.038099199533462524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,16,power_law_1.01,0.07497599720954895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,16,power_law_1.01,0.040268799662590025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,16,power_law_1.01,0.08615040183067321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,16,power_law_1.01,0.04266240000724793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,16,power_law_1.01,0.04555520117282867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,16,power_law_1.01,0.10106240510940552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,16,balanced,0.1692053278287252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,16,balanced,0.07111999889214833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,16,power_law_1.01,0.026054400205612182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,16,power_law_1.01,0.04688639938831329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,16,power_law_1.01,0.12995200157165526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,16,power_law_1.01,0.024198399484157564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,16,balanced,0.2201706568400065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,16,power_law_1.01,0.05193600058555603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,16,power_law_1.01,0.15568000078201294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,16,power_law_1.01,0.023871999979019166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,16,balanced,0.08320533235867818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,16,power_law_1.01,0.05363839864730835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,16,power_law_1.01,0.21563520431518554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,16,power_law_1.01,0.02617599964141846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,16,power_law_1.01,0.06894720196723939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,16,power_law_1.01,0.2801919937133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,16,power_law_1.01,0.026841598749160766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,16,power_law_1.01,0.07964159846305847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,16,power_law_1.01,0.027980801463127137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,16,power_law_1.01,0.3256959915161133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,16,power_law_1.01,0.09541760087013244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,16,power_law_1.01,0.028352001309394838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,16,power_law_1.01,0.4827904224395752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,16,power_law_1.01,0.1172287940979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,16,power_law_1.01,0.028921601176261903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,16,balanced,0.11197333534558614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,16,power_law_1.01,0.1601472020149231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,16,power_law_1.01,1.0446975708007813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,16,power_law_1.01,0.029504001140594482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,16,power_law_1.01,0.19211519956588746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,16,power_law_1.01,0.030553600192070006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,16,balanced,0.26311467091242474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,16,power_law_1.01,0.2646336078643799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,16,power_law_1.01,0.03162879943847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,16,power_law_1.2,0.025222399830818178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,16,power_law_1.01,0.3789184093475342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,16,power_law_1.01,0.032441601157188416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,16,balanced,0.2589919964472453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,16,power_law_1.2,0.021644799411296843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,16,power_law_1.01,0.033139199018478394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,16,power_law_1.01,0.4279488086700439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,16,power_law_1.2,0.021804800629615782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,16,balanced,0.13755200306574503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,16,power_law_1.01,0.03552640080451965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,16,power_law_1.01,0.716326379776001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,16,power_law_1.2,0.023296000063419343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,16,power_law_1.2,0.024089600145816802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,16,power_law_1.01,0.038406398892402646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,16,power_law_1.01,1.3792767524719238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,16,power_law_1.2,0.02600319981575012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,16,power_law_1.01,0.03871360123157501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,16,power_law_1.2,0.026572799682617186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,16,power_law_1.2,0.028972798585891725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,16,balanced,0.20278400182724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,16,power_law_1.01,0.044607999920845035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,16,power_law_1.2,0.03107840120792389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,16,power_law_1.01,0.05128960013389587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,16,power_law_1.2,0.03226880133152008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,16,power_law_1.2,0.0331712007522583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,16,power_law_1.01,0.062067198753356936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,16,balanced,0.40974398454030353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,16,power_law_1.2,0.03336319923400879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,16,power_law_1.01,0.07171199917793274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,16,power_law_1.2,0.03391999900341034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,16,power_law_1.2,0.04014720022678375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,16,power_law_1.01,0.08950399756431579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,16,balanced,0.2708746592203776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,16,power_law_1.2,0.04373759925365448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,16,power_law_1.2,0.04522239863872528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,16,power_law_1.01,0.11445120573043824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,16,power_law_1.2,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,16,power_law_1.01,0.15699199438095093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,16,power_law_1.2,0.0561024010181427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,16,power_law_1.2,0.05581439733505249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,16,power_law_1.01,0.22661120891571046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,16,power_law_1.2,0.06632959842681885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,16,power_law_1.2,0.07022719979286193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,16,power_law_1.01,0.2960959911346436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,16,power_law_1.2,0.09363840222358703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,16,power_law_1.2,0.1102336049079895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,16,power_law_1.01,0.4070784091949463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,16,balanced,0.333621342976888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,16,power_law_1.2,0.16176639795303344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,16,power_law_1.01,0.5991040229797363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,16,power_law_1.2,0.1851904034614563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,16,balanced,0.4924693504969279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,16,power_law_1.01,0.6430784225463867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,16,power_law_1.2,0.27393920421600343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,16,power_law_1.01,1.1152128219604491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,16,power_law_1.2,0.40868477821350097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,16,power_law_1.2,0.45740160942077634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,16,power_law_1.01,2.244428825378418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,16,power_law_1.2,0.7418623924255371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,16,power_law_1.2,1.7874176025390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,16,power_law_1.2,0.03715839982032776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,16,power_law_1.2,0.029791998863220214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,16,balanced,0.7808106740315756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,16,power_law_1.2,0.02956799864768982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,16,balanced,0.5115626653035482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,16,power_law_1.2,0.03158400058746338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,16,power_law_1.2,0.03230080008506775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,16,power_law_1.2,0.034016001224517825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,16,power_law_1.2,0.03361279964447021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,16,power_law_1.2,0.034860798716545106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,16,power_law_1.2,0.03542400002479553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,16,power_law_1.2,0.03594880104064942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,16,power_law_1.2,0.03671680092811584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,16,power_law_1.2,0.0379967987537384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,16,power_law_1.2,0.03827199935913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,16,power_law_1.2,0.039743998646736146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,16,power_law_1.2,0.04364160001277924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,16,power_law_1.2,0.045849600434303285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,16,power_law_1.2,0.04714879989624023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,16,power_law_1.2,0.056415998935699464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,16,power_law_1.2,0.057817602157592775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,16,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,16,power_law_1.2,0.08271359801292419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,16,power_law_1.2,0.12449920177459717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,16,power_law_1.2,0.1256384015083313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,16,power_law_1.2,0.183571195602417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,16,power_law_1.2,0.20524799823760986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,16,power_law_1.2,0.3338047981262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,16,power_law_1.2,0.5403711795806885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,16,power_law_1.2,0.5772736072540283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,16,power_law_1.2,1.0722687721252442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,16,power_law_1.2,2.0811391830444337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,16,balanced,1.0000320275624592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,16,power_law_1.2,0.026035198569297792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,16,power_law_1.2,0.02401279956102371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,16,power_law_1.2,0.024172799289226533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,16,power_law_1.2,0.02643199861049652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,64,balanced,0.04028266668319702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,16,power_law_1.2,0.0271232008934021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,64,balanced,0.038880000511805214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,16,power_law_1.2,0.028332799673080444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,64,balanced,0.03886933376391729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,64,balanced,0.040549332896868386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,16,power_law_1.2,0.028454399108886717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,64,balanced,0.0513919989267985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,16,power_law_1.2,0.02900480031967163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,64,balanced,0.053802669048309326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,16,power_law_1.2,0.030086401104927062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,64,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,16,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,64,balanced,0.05089599887530009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,16,power_law_1.2,0.03192960023880005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,64,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,16,power_law_1.2,0.03307519853115082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,64,balanced,0.051455999414126076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,16,power_law_1.2,0.03413119912147522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,64,balanced,0.05240533252557119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,64,balanced,0.052746668457984924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,16,power_law_1.2,0.036499199271202085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,64,balanced,0.052501335740089417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,16,power_law_1.2,0.03930880129337311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,64,balanced,0.053914666175842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,16,power_law_1.2,0.04094719886779785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,64,balanced,0.057909334699312844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,64,balanced,0.058431997895240784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,64,balanced,0.05809600154558817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,16,power_law_1.2,0.046911999583244324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,64,balanced,0.06311466793219249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,16,power_law_1.2,0.05751680135726929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,64,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,16,power_law_1.2,0.07071359753608704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,64,balanced,0.07448000212510426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,16,power_law_1.2,0.09288319945335388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,64,balanced,0.03376533339420954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,16,power_law_1.2,0.10888320207595825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,64,balanced,0.06869333485762279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,64,balanced,0.034671999514102936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,64,balanced,0.03578133384386698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,16,power_law_1.2,0.13861759901046752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,64,balanced,0.08514666557312012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,64,balanced,0.036746665835380554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,16,power_law_1.2,0.1644927978515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,64,balanced,0.0412266676624616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,64,balanced,0.04081599911053976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,64,balanced,0.08858666817347209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,16,power_law_1.2,0.23732481002807618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,64,balanced,0.040463998913764954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,64,balanced,0.04016000032424927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,16,power_law_1.2,0.2870016098022461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,64,balanced,0.040362666050593056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,64,balanced,0.11961066722869873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,16,power_law_1.2,0.6044352054595947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,64,balanced,0.040965333580970764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,64,power_law_1.01,0.04774399995803833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,64,balanced,0.04195733368396759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,16,power_law_1.2,0.696134376525879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,64,power_law_1.01,0.045952001214027406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,64,balanced,0.04188799858093262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,64,power_law_1.01,0.041196799278259276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,16,power_law_1.2,1.0274111747741699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,64,balanced,0.045253331462542214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,64,power_law_1.01,0.0505407989025116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,64,power_law_1.01,0.050892800092697144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,64,balanced,0.0450133333603541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,16,power_law_1.2,2.0744064331054686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,64,balanced,0.12418666481971741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,64,power_law_1.01,0.05203199982643127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,64,balanced,0.04709866642951965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,64,power_law_1.01,0.05249279737472534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,16,power_law_1.2,3.3368896484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,64,balanced,0.047653332352638245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,64,power_law_1.01,0.05173119902610779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,64,power_law_1.01,0.053395199775695804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,64,balanced,0.05227733155091604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,64,balanced,0.027658666173617046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,64,power_law_1.01,0.05422080159187317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,64,power_law_1.01,0.03642880022525787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,64,power_law_1.01,0.05727999806404114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,64,balanced,0.05898133416970571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,64,balanced,0.027727998793125153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,64,power_law_1.01,0.06398079991340637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,64,balanced,0.027850667635599773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,64,power_law_1.01,0.036294400691986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,64,power_law_1.01,0.07212160229682922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,64,balanced,0.18892266352971396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,64,balanced,0.061797335743904114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,64,power_law_1.01,0.06730239987373351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,64,balanced,0.029135999580224354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,64,power_law_1.01,0.03704319894313812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,64,power_law_1.01,0.07719680070877075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,64,balanced,0.07239466905593872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,64,balanced,0.034245334565639496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,64,power_law_1.01,0.04014720022678375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,64,power_law_1.01,0.08844159841537476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,64,power_law_1.01,0.08639360070228577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,64,balanced,0.034485332667827606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,64,power_law_1.01,0.04056960046291351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,64,power_law_1.01,0.11545599699020385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,64,balanced,0.07854933540026347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,64,balanced,0.03483733286460241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,64,power_law_1.01,0.03933440148830414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,64,power_law_1.01,0.11090559959411621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,64,power_law_1.01,0.14161920547485352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,64,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,64,power_law_1.01,0.03963519930839539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,64,power_law_1.01,0.15361920595169068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,64,balanced,0.0941973328590393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,64,power_law_1.01,0.04010240137577057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,64,balanced,0.0341386670867602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,64,power_law_1.01,0.19545600414276124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,64,balanced,0.21259733041127524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,64,power_law_1.01,0.042284798622131345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,64,balanced,0.03641066700220108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,64,power_law_1.01,0.20074880123138428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,64,power_law_1.01,0.34279680252075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,64,power_law_1.01,0.0430400013923645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,64,balanced,0.03573333223660787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,64,balanced,0.10804266730944316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,64,power_law_1.01,0.41809282302856443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,64,power_law_1.01,0.044684800505638125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,64,balanced,0.035071998834609985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,64,power_law_1.01,0.5825664043426514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,64,power_law_1.01,0.04762240052223206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,64,balanced,0.03584533433119456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,64,power_law_1.01,0.7196991920471192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,64,power_law_1.01,0.050374400615692136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,64,balanced,0.03696000079313914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,64,power_law_1.01,0.9547264099121093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,64,balanced,0.1437173287073771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,64,power_law_1.01,0.05084159970283508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,64,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,64,power_law_1.01,1.7635200500488282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,64,power_law_1.01,0.0598143994808197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,64,balanced,0.042175998290379844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,64,power_law_1.01,3.2293441772460936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,64,power_law_1.01,0.06232320070266724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,64,power_law_1.01,0.06497920155525208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,64,balanced,0.23607999086380005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,64,balanced,0.16765334208806357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,64,power_law_1.01,0.08140159845352173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,64,power_law_1.01,0.08444160223007202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,64,power_law_1.01,0.10962560176849365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,64,power_law_1.2,0.047577598690986635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,64,power_law_1.01,0.11786880493164062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,64,balanced,0.04192000130812327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,64,power_law_1.01,0.16159360408782958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,64,power_law_1.2,0.04199039936065674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,64,balanced,0.048341333866119385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,64,power_law_1.01,0.1992576003074646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,64,balanced,0.24342399835586548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,64,power_law_1.01,0.028537601232528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,64,power_law_1.2,0.04364160001277924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,64,balanced,0.05091199775536855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,64,power_law_1.01,0.2839423894882202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,64,power_law_1.2,0.05015680193901062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,64,power_law_1.01,0.0281792014837265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,64,power_law_1.01,0.028255999088287354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,64,power_law_1.01,0.3374399900436401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,64,power_law_1.2,0.05090559720993042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,64,power_law_1.01,0.03126400113105774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,64,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,64,power_law_1.01,0.5675648212432861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,64,power_law_1.01,0.03175039887428284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,64,power_law_1.2,0.052876800298690796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,64,power_law_1.01,0.6535935878753663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,64,power_law_1.01,0.03273600041866302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,64,power_law_1.2,0.05308160185813904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,64,power_law_1.01,0.9757247924804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,64,balanced,0.05979733169078827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,64,power_law_1.01,0.032390400767326355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,64,power_law_1.2,0.05434880256652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,64,balanced,0.29603733619054157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,64,balanced,0.3388426701227824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,64,power_law_1.01,0.03288320004940033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,64,power_law_1.2,0.05482239723205566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,64,power_law_1.01,1.2064831733703614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,64,balanced,0.06392000118891399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,64,power_law_1.01,0.033548799157142636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,64,power_law_1.2,0.061459201574325564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,64,power_law_1.01,2.7146495819091796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,64,power_law_1.01,0.036671999096870425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,64,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,64,power_law_1.01,0.044300800561904906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,64,power_law_1.2,0.07118719816207886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,64,power_law_1.01,0.04696959853172302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,64,power_law_1.2,0.07463679909706115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,64,balanced,0.07880533238252004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,64,power_law_1.01,0.05076479911804199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,64,power_law_1.2,0.09055359959602356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,64,power_law_1.01,0.0531391978263855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,64,power_law_1.2,0.09595519900321961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,64,balanced,0.34727998574574787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,64,power_law_1.01,0.05847039818763733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,64,balanced,0.08780266841252644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,64,power_law_1.2,0.0978879988193512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,64,power_law_1.01,0.07025920152664185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,64,power_law_1.2,0.13114240169525146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,64,power_law_1.2,0.13080960512161255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,64,power_law_1.01,0.0632960021495819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,64,power_law_1.2,0.17496320009231567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,64,power_law_1.01,0.08606719970703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,64,power_law_1.2,0.20013439655303955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,64,power_law_1.2,0.26156799793243407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,64,power_law_1.01,0.1075711965560913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,64,power_law_1.2,0.32641921043395994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,64,balanced,0.1188213328520457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,64,power_law_1.2,0.5409088134765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,64,power_law_1.2,0.5479296207427978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,64,power_law_1.01,0.12154879570007324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,64,power_law_1.2,0.8568256378173829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,64,power_law_1.01,0.1543552041053772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,64,power_law_1.2,1.3981375694274902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,64,balanced,0.14270400007565817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,64,power_law_1.2,1.801740837097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,64,balanced,0.525056004524231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,64,power_law_1.01,0.1660416007041931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,64,power_law_1.2,3.55230712890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,64,power_law_1.01,0.2757055997848511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,64,power_law_1.2,7.113260650634766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,64,power_law_1.01,0.417299222946167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,64,balanced,0.6420906782150269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,64,balanced,0.19951466719309488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,64,power_law_1.01,0.47507200241088865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,64,power_law_1.01,0.7429696083068847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,64,power_law_1.01,1.1748415946960449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,64,balanced,0.25279466311136883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,64,power_law_1.01,1.4082367897033692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,64,power_law_1.01,1.83240966796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,64,power_law_1.01,4.327923202514649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,64,power_law_1.2,0.03653120100498199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,64,power_law_1.2,0.03504000008106232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,64,balanced,0.31385600566864014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,64,power_law_1.2,0.036211198568344115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,64,power_law_1.2,0.03925760090351105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,64,power_law_1.2,0.04008319973945618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,64,balanced,1.0097333590189617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,64,power_law_1.2,0.03948160111904144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,64,power_law_1.2,0.03957119882106781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,64,power_law_1.2,0.04154239892959595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,64,power_law_1.2,0.043263998627662656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,64,power_law_1.2,0.042668798565864564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,64,power_law_1.2,0.044940799474716187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,64,power_law_1.2,0.049209600687026976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,64,power_law_1.2,0.052851200103759766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,64,power_law_1.2,0.05568640232086182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,64,balanced,0.5012693405151367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,64,power_law_1.2,0.06214399933815003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,64,power_law_1.2,0.06531199812889099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,64,power_law_1.2,0.06764159798622131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,64,power_law_1.2,0.08747519850730896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,64,power_law_1.2,0.11088639497756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,64,power_law_1.2,0.13823360204696655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,64,power_law_1.2,0.13526400327682495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,64,power_law_1.2,0.19329919815063476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,64,power_law_1.2,0.02996479868888855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,64,power_law_1.2,0.2465087890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,64,power_law_1.2,0.028166401386260986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,64,power_law_1.2,0.39385600090026857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,64,power_law_1.2,0.029824000597000123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,64,power_law_1.2,0.03260799944400787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,64,power_law_1.2,0.4641024112701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,64,power_law_1.2,0.03311359882354736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,64,power_law_1.2,0.03392640054225922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,64,power_law_1.2,0.7545023918151855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,64,power_law_1.2,0.03361279964447021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,64,power_law_1.2,0.9364543914794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,64,power_law_1.2,0.03570559918880463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,64,power_law_1.2,0.0355648010969162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,64,power_law_1.2,1.1554304122924806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,64,power_law_1.2,0.03749119937419891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,64,power_law_1.2,0.046649599075317384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,64,power_law_1.2,2.5100608825683595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,64,power_law_1.2,0.047916799783706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,64,power_law_1.2,0.05123839974403381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,64,power_law_1.2,5.187955093383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,64,power_law_1.2,0.05469440221786499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,64,power_law_1.2,0.06588799953460693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,64,power_law_1.2,0.06958079934120179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,32,balanced,0.034234667817751564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,32,balanced,0.03427733232577642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,64,power_law_1.2,0.07279360294342041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,32,balanced,0.03421866645415624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,64,power_law_1.2,0.09746559858322143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,64,power_law_1.2,0.1271999955177307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,32,balanced,0.039919999738534294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,32,balanced,0.050954664746920265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,64,power_law_1.2,0.16432640552520753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,32,balanced,0.05129066606362661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,64,balanced,0.9887786706288656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,64,power_law_1.2,0.18910720348358154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,32,balanced,0.05075199902057648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,64,power_law_1.2,0.2309119939804077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,32,balanced,0.05039466420809428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,64,power_law_1.2,0.41637120246887205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,32,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,32,balanced,0.05116266508897146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,32,balanced,0.05202666421731313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,64,power_law_1.2,0.562943983078003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,32,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,64,power_law_1.2,0.8556672096252441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,32,balanced,0.05258666475613912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,64,power_law_1.2,1.180281639099121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,64,power_law_1.2,1.6702592849731446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,32,balanced,0.05569066603978475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,32,balanced,0.05682666599750519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,64,power_law_1.2,2.2692096710205076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,32,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,64,power_law_1.2,3.845119857788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,32,balanced,0.0580320010582606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,64,power_law_1.2,8.001702117919923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,32,balanced,0.0676746666431427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,32,balanced,0.06242666641871134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,32,balanced,0.035418666899204254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,32,balanced,0.07409066458543141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,32,balanced,0.03487999985615412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,32,balanced,0.03437866767247518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,32,balanced,0.07025599976380666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,32,balanced,0.03518400092919668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,32,balanced,0.038319999972979225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,32,balanced,0.0869599978129069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,32,balanced,0.039359999199708305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,32,balanced,0.03924266745646795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,32,balanced,0.039546666045983635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,32,balanced,0.0271573339899381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,32,balanced,0.09047466516494751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,32,balanced,0.03951466580231985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,32,balanced,0.02741333345572154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,32,balanced,0.04036800066630045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,32,balanced,0.027424000203609467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,32,balanced,0.04072533299525579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,32,balanced,0.029066666960716248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,32,balanced,0.033333333830038704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,32,balanced,0.1277653376261393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,32,balanced,0.04104000081618627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,32,balanced,0.03392533212900162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,32,balanced,0.043194666504859924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,32,balanced,0.03480533262093862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,32,balanced,0.04435733457406362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,32,balanced,0.03376533339420954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,32,balanced,0.033733333150545754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,32,balanced,0.04696533580621084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,32,power_law_1.01,0.04684160053730011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,32,balanced,0.13271466890970865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,32,balanced,0.03579733272393545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,32,balanced,0.04683200021584829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,32,balanced,0.03428266694148382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,32,power_law_1.01,0.039468801021575926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,32,balanced,0.05077866713205973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,32,balanced,0.03540800015131632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,32,power_law_1.01,0.039078399538993835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,32,balanced,0.038015998899936676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,32,balanced,0.06193066636721293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,32,power_law_1.01,0.043968001008033754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,32,balanced,0.036831999818483986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,32,power_law_1.01,0.04534400105476379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,32,balanced,0.061797335743904114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,32,balanced,0.2023893396059672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,32,power_law_1.01,0.04881280064582825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,32,balanced,0.07372800012429555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,32,power_law_1.01,0.03935999870300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,32,balanced,0.04345066845417023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,32,power_law_1.01,0.05006719827651977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,32,balanced,0.04419733087221781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,32,power_law_1.01,0.038201600313186646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,32,power_law_1.01,0.05004159808158874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,32,balanced,0.07964266836643219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,32,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,32,power_law_1.01,0.05203199982643127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,32,power_law_1.01,0.05251200199127197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,32,power_law_1.01,0.03635840117931366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,32,balanced,0.09898133079210918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,32,power_law_1.01,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,32,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,32,power_law_1.01,0.05865600109100342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,32,power_law_1.01,0.038899201154708865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,32,balanced,0.2355466683705648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,32,balanced,0.04586666822433472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,32,balanced,0.11103999614715576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,32,power_law_1.01,0.06109439730644226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,32,power_law_1.01,0.03834240138530731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,32,balanced,0.05197866757710775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,32,power_law_1.01,0.06350079774856568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,32,power_law_1.01,0.0401856005191803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,32,power_law_1.01,0.04213759899139404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,32,power_law_1.01,0.06729599833488464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,32,balanced,0.05579733351866404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,32,balanced,0.15413866440455118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,32,power_law_1.01,0.04429439902305603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,32,power_law_1.01,0.07347840070724487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,32,power_law_1.01,0.04462080001831055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,32,power_law_1.01,0.08098559975624084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,32,power_law_1.01,0.0979968011379242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,32,power_law_1.01,0.04767360091209412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,32,balanced,0.06523199876149495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,32,power_law_1.01,0.0976639986038208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,32,power_law_1.01,0.050323200225830075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,32,balanced,0.17983466386795044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,32,balanced,0.07204266885916392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,32,power_law_1.01,0.12620160579681397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,32,power_law_1.01,0.05258880257606506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,32,balanced,0.3018453319867452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,32,power_law_1.01,0.057715201377868654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,32,power_law_1.01,0.13300479650497438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,32,power_law_1.01,0.17185280323028565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,32,power_law_1.01,0.05917440056800842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,32,power_law_1.01,0.18625919818878173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,32,power_law_1.01,0.06537600159645081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,32,power_law_1.01,0.08144639730453491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,32,power_law_1.01,0.2473151922225952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,32,balanced,0.09175999959309895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,32,power_law_1.01,0.08383359909057617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,32,balanced,0.264138658841451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,32,power_law_1.01,0.31297280788421633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,32,power_law_1.01,0.10092799663543701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,32,power_law_1.01,0.4625279903411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,32,balanced,0.10316266616185506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,32,power_law_1.01,0.11219199895858764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,32,power_law_1.01,0.586732816696167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,32,power_law_1.01,0.15615999698638916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,32,power_law_1.01,0.1868288040161133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,32,power_law_1.01,0.6766335964202881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,32,power_law_1.01,0.2571712017059326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,32,power_law_1.01,1.3083647727966308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,32,power_law_1.01,0.32692480087280273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,32,power_law_1.01,0.5009856224060059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,32,balanced,0.14244266351064047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,32,power_law_1.01,2.3036544799804686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,32,balanced,0.3236853281656901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,32,power_law_1.01,0.5874688148498535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,32,balanced,0.3882559935251872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,32,power_law_1.01,0.6822591781616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,32,power_law_1.01,1.1297663688659667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,32,balanced,0.17439999183019003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,32,power_law_1.01,3.1793472290039064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,32,power_law_1.01,0.03113600015640259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,32,power_law_1.01,0.02932479977607727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,32,power_law_1.2,0.047116801142692566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,32,power_law_1.01,0.028384000062942505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,32,balanced,0.38465599219004315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,32,balanced,0.25600000222524005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,32,power_law_1.01,0.03175680041313171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,32,power_law_1.2,0.03969280123710632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,32,power_law_1.01,0.03209599852561951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,32,power_law_1.2,0.041631999611854556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,32,power_law_1.01,0.03386240005493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,32,power_law_1.01,0.03386879861354828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,32,power_law_1.2,0.046105599403381346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,32,power_law_1.01,0.035104000568389894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,32,power_law_1.2,0.04407039880752563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,32,power_law_1.2,0.047219198942184445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,32,power_law_1.01,0.038406398892402646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,32,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,32,balanced,0.34031999111175537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,32,power_law_1.01,0.03798399865627289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,32,power_law_1.2,0.05251839756965637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,32,power_law_1.2,0.05335680246353149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,32,power_law_1.01,0.039654400944709775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,32,power_law_1.2,0.05434880256652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,32,power_law_1.01,0.04201599955558777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,32,power_law_1.2,0.056979197263717654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,32,power_law_1.01,0.04721280038356781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,32,power_law_1.2,0.05976319909095764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,32,power_law_1.01,0.05261440277099609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,32,power_law_1.2,0.06488320231437683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,32,power_law_1.2,0.06546559929847717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,32,power_law_1.01,0.05782399773597717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,32,power_law_1.2,0.04074879884719849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,32,balanced,0.5876853466033936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,32,power_law_1.2,0.07212799787521362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,32,power_law_1.01,0.06027519702911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,32,power_law_1.2,0.07983360290527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,32,power_law_1.2,0.03500800132751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,32,power_law_1.2,0.08850560188293458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,32,power_law_1.01,0.06398079991340637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,32,power_law_1.2,0.03518719971179962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,32,power_law_1.2,0.10951039791107178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,32,power_law_1.01,0.08018559813499451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,32,power_law_1.2,0.035897600650787356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,32,balanced,0.7533226807912191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,32,power_law_1.01,0.09363840222358703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,32,power_law_1.2,0.1040768027305603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,32,power_law_1.2,0.0367680013179779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,32,balanced,0.42633601029713947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,32,power_law_1.2,0.14099199771881105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,32,power_law_1.2,0.03882879912853241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,32,power_law_1.01,0.11295360326766968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,32,power_law_1.01,0.14586880207061767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,32,power_law_1.2,0.03868800103664398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,32,power_law_1.2,0.13352960348129272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,32,power_law_1.2,0.04252159893512726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,32,power_law_1.2,0.20826880931854247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,32,power_law_1.01,0.18133120536804198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,32,power_law_1.2,0.043680000305175784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,32,power_law_1.01,0.2792191982269287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,32,power_law_1.2,0.23407359123229982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,32,power_law_1.2,0.04379520118236542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,32,power_law_1.2,0.32182400226593016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,32,power_law_1.01,0.4050623893737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,32,power_law_1.2,0.04672000110149384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,32,power_law_1.01,0.49214720726013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,32,power_law_1.2,0.48188161849975586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,32,power_law_1.2,0.046700799465179445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,32,power_law_1.01,0.6571839809417724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,32,power_law_1.2,0.7425983905792236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,32,power_law_1.2,0.05023360252380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,32,power_law_1.01,0.9438976287841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,32,power_law_1.2,0.05359359979629517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,32,power_law_1.2,1.115552043914795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,32,power_law_1.01,1.3011967658996582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,32,power_law_1.2,0.05796480178833008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,32,power_law_1.2,1.31911039352417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,32,power_law_1.2,0.0646399974822998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,32,power_law_1.01,1.795110321044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,32,power_law_1.2,1.8134143829345704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,32,power_law_1.2,0.07162879705429077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,32,power_law_1.01,4.097177505493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,32,power_law_1.2,0.08532480001449586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,32,power_law_1.2,4.286764907836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,32,balanced,0.6548693180084229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,32,power_law_1.2,0.09279999732971192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,32,power_law_1.2,0.11470719575881957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,32,power_law_1.2,0.12234879732131958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,32,power_law_1.2,0.17663359642028809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,32,power_law_1.2,0.20794239044189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,32,power_law_1.2,0.3126784086227417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,32,balanced,1.1271573702494304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,32,power_law_1.2,0.5088448047637939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,32,power_law_1.2,0.5990399837493896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,32,power_law_1.2,0.8535552024841309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,32,power_law_1.2,1.2632448196411132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,32,power_law_1.2,1.81343994140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,32,power_law_1.2,3.6587520599365235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,32,balanced,1.2896160284678142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,32,power_law_1.2,0.030067199468612672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,32,power_law_1.2,0.027084800601005554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,32,power_law_1.2,0.027929601073265076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,16,balanced,0.03368533402681351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,32,power_law_1.2,0.03116160035133362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,32,power_law_1.2,0.030931198596954347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,16,balanced,0.03427733232577642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,16,balanced,0.03057066599527995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,32,power_law_1.2,0.03270399868488312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,16,balanced,0.03846933444341024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,32,power_law_1.2,0.03224959969520569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,16,balanced,0.04865066707134247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,32,power_law_1.2,0.03560320138931274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,16,balanced,0.0498986691236496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,32,power_law_1.2,0.03767040073871612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,16,balanced,0.05002133548259735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,32,power_law_1.2,0.03874559998512268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,16,balanced,0.05011733373006185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,32,power_law_1.2,0.04168320000171662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,16,balanced,0.050399998823801674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,32,power_law_1.2,0.047705599665641786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,16,balanced,0.05100800096988678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,32,power_law_1.2,0.04995200037956238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,16,balanced,0.051141331593195595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,16,balanced,0.05227200190226237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,32,power_law_1.2,0.05317760109901428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,16,balanced,0.052704001466433205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,16,balanced,0.0543146679798762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,32,power_law_1.2,0.05998079776763916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,16,balanced,0.05729066828886668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,32,power_law_1.2,0.06223359704017639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,16,balanced,0.058362667759259544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,16,balanced,0.059706668059031166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,32,power_law_1.2,0.07876480221748353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,16,balanced,0.07116266588370006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,32,power_law_1.2,0.08541439771652222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,16,balanced,0.06454400221506755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,32,power_law_1.2,0.12226560115814208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,16,balanced,0.032186667124430336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,16,balanced,0.07824533184369405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,16,balanced,0.03249066571394602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,32,power_law_1.2,0.13682559728622437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,16,balanced,0.033674667278925575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,16,balanced,0.07367999851703644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,16,balanced,0.035301332672437034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,32,power_law_1.2,0.1654207944869995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,16,balanced,0.03920533259709676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,16,balanced,0.040735999743143715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,16,balanced,0.09809600313504536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,32,power_law_1.2,0.21726720333099364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,16,balanced,0.04080000023047129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,16,balanced,0.0408746674656868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,32,power_law_1.2,0.3886336088180542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,16,balanced,0.040752001106739044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,16,balanced,0.04154666761557261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,16,balanced,0.10136533776919048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,32,power_law_1.2,0.6863552093505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,16,balanced,0.04155199974775314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,16,balanced,0.042170668641726174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,32,power_law_1.2,0.7751232147216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,16,balanced,0.044218664367993675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,32,power_law_1.2,1.2479743957519531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,16,balanced,0.04689066608746847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,16,balanced,0.14308266838391623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,16,balanced,0.0491839994986852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,32,power_law_1.2,1.4215616226196288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,16,balanced,0.048351998130480446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,16,balanced,0.051488002141316734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,32,power_law_1.2,1.7771392822265626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,16,balanced,0.06487999856472015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,16,balanced,0.1585760017236074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,16,balanced,0.06529066463311513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,32,power_law_1.2,3.4913089752197264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,16,balanced,0.07800533374150594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,32,power_law_1.2,8.760140991210937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,16,power_law_1.01,0.04732159972190857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,16,balanced,0.08685866991678874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,16,power_law_1.01,0.035545599460601804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,16,balanced,0.1092800001303355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,16,power_law_1.01,0.0367680013179779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,16,balanced,0.24778133630752563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,16,power_law_1.01,0.040659201145172116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,16,balanced,0.1216373344262441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,16,power_law_1.01,0.045075199007987975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,16,power_law_1.01,0.048607999086380006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,16,power_law_1.01,0.041920000314712526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,16,balanced,0.02720533311367035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,16,power_law_1.01,0.04922240078449249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,16,balanced,0.1704053282737732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,16,power_law_1.01,0.038252800703048706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,16,power_law_1.01,0.0505407989025116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,16,balanced,0.027327999472618103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,16,balanced,0.027914665639400482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,16,power_law_1.01,0.03443840146064758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,16,power_law_1.01,0.051558399200439455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,16,balanced,0.29683732986450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,16,balanced,0.02979733298222224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,16,power_law_1.01,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,16,power_law_1.01,0.036006399989128114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,16,balanced,0.03514666606982549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,16,balanced,0.20637333393096924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,16,power_law_1.01,0.03797119855880737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,16,power_law_1.01,0.056992000341415404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,16,balanced,0.0359253336985906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,16,power_law_1.01,0.04118399918079376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,16,power_law_1.01,0.05842559933662415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,16,balanced,0.03597866743803024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,16,power_law_1.01,0.04063999950885773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,16,power_law_1.01,0.05940480232238769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,16,balanced,0.035973332822322845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,16,power_law_1.01,0.040556800365447995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,16,balanced,0.03640000025431315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,16,power_law_1.01,0.06032639741897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,16,power_law_1.01,0.0430400013923645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,16,balanced,0.038202665746212006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,16,power_law_1.01,0.03480319976806641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,16,balanced,0.30537599325180054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,16,power_law_1.01,0.06664959788322448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,16,balanced,0.038005332152048744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,16,power_law_1.01,0.044095999002456664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,16,power_law_1.01,0.06647679805755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,16,power_law_1.01,0.029094401001930236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,16,power_law_1.01,0.046054399013519286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,16,balanced,0.03811199963092804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,16,balanced,0.3390186627705892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,16,power_law_1.01,0.07516160011291503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,16,power_law_1.01,0.028070399165153505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,16,power_law_1.01,0.04742400050163269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,16,balanced,0.040405333042144775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,16,power_law_1.01,0.0917248010635376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,16,power_law_1.01,0.03252480030059814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,16,power_law_1.01,0.0492031991481781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,16,balanced,0.040421334405740104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,16,power_law_1.01,0.03292160034179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,16,power_law_1.01,0.08986240029335021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,16,power_law_1.01,0.05070080161094666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,16,power_law_1.01,0.035846400260925296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,16,power_law_1.01,0.1050879955291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,16,power_law_1.01,0.05987840294837952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,16,balanced,0.04930133124192556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,16,balanced,0.3789546489715576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,16,power_law_1.01,0.03700479865074158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,16,power_law_1.01,0.062067198753356936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,16,power_law_1.01,0.12433279752731323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,16,balanced,0.05061866839726766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,16,power_law_1.01,0.036262398958206175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,16,power_law_1.01,0.06554239988327026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,16,power_law_1.01,0.16459519863128663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,16,power_law_1.01,0.08354560136795045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,16,power_law_1.01,0.04081920087337494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,16,power_law_1.01,0.17756799459457398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,16,power_law_1.01,0.0811456024646759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,16,power_law_1.01,0.2727807998657227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,16,power_law_1.01,0.04252159893512726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,16,power_law_1.2,0.04715520143508911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,16,power_law_1.01,0.0970304012298584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,16,power_law_1.01,0.2801408052444458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,16,power_law_1.01,0.045100799202919005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,16,power_law_1.2,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,16,balanced,0.05375466744105021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,16,power_law_1.01,0.11183359622955322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,16,power_law_1.01,0.4490687847137451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,16,power_law_1.01,0.04661119878292084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,16,power_law_1.2,0.035699200630187986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,16,balanced,0.06137066582838694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,16,power_law_1.01,0.16514559984207153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,16,power_law_1.01,0.04832000136375427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,16,power_law_1.01,0.5603328227996827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,16,power_law_1.2,0.04179840087890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,16,balanced,0.49349331855773926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,16,power_law_1.01,0.18528000116348267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,16,balanced,0.46325333913167316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,16,power_law_1.01,0.05253120064735413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,16,balanced,0.06427200138568878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,16,power_law_1.01,0.682150411605835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,16,power_law_1.2,0.04195199906826019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,16,power_law_1.01,0.25189759731292727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,16,power_law_1.2,0.048640000820159915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,16,power_law_1.01,1.07258882522583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,16,power_law_1.01,0.06280320286750793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,16,power_law_1.01,0.3124991893768311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,16,power_law_1.2,0.05000320076942444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,16,power_law_1.01,0.06711040139198303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,16,power_law_1.01,0.5031936168670654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,16,balanced,0.07958933214346568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,16,power_law_1.01,2.3884416580200196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,16,power_law_1.2,0.05146880149841308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,16,power_law_1.01,0.6254335880279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,16,power_law_1.2,0.05304960012435913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,16,balanced,0.08778132994969685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,16,power_law_1.01,0.6830143928527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,16,power_law_1.01,0.06965759992599488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,16,power_law_1.2,0.05419520139694214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,16,power_law_1.01,1.2958144187927245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,16,power_law_1.01,0.09221760034561158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,16,power_law_1.2,0.0561024010181427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,16,power_law_1.01,0.10168319940567017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,16,power_law_1.2,0.05683839917182922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,16,power_law_1.01,2.587571144104004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,16,power_law_1.2,0.06039680242538452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,16,balanced,0.11544533570607503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,16,power_law_1.01,0.11452800035476685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,16,power_law_1.2,0.061484801769256595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,16,power_law_1.01,0.14742399454116822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,16,power_law_1.2,0.07041280269622803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,16,balanced,0.6936639944712321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,16,balanced,0.13470932841300964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,16,power_law_1.2,0.07466880083084107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,16,power_law_1.01,0.24574079513549804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,16,power_law_1.2,0.08288000226020813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,16,power_law_1.01,0.27653119564056394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,16,power_law_1.2,0.09812480211257935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,16,power_law_1.2,0.09829760193824769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,16,balanced,0.19992534319559732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,16,power_law_1.01,0.40088319778442383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,16,power_law_1.2,0.1223680019378662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,16,power_law_1.01,0.509004783630371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,16,power_law_1.2,0.13447680473327636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,16,power_law_1.01,0.7531583786010743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,16,power_law_1.2,0.204256010055542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,16,power_law_1.01,1.0266176223754884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,16,power_law_1.2,0.2195647954940796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,16,balanced,0.2635519901911418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,16,power_law_1.2,0.27294719219207764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,16,power_law_1.01,1.2874048233032227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,16,power_law_1.2,0.423795223236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,16,balanced,0.9511146545410156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,16,power_law_1.01,1.8495616912841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,16,power_law_1.2,0.5005568027496338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,16,power_law_1.2,0.8605952262878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,16,power_law_1.01,3.88076171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,16,power_law_1.2,1.0234432220458984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,16,balanced,0.38102400302886963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,16,power_law_1.2,1.5132351875305177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,16,power_law_1.2,4.414131164550781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,16,balanced,0.49486398696899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,16,balanced,1.3584426244099934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,16,power_law_1.2,0.042310398817062375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,16,power_law_1.2,0.033055999875068666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,16,power_law_1.2,0.03391999900341034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,16,balanced,0.6101546684900919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,16,power_law_1.2,0.03609600067138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,16,power_law_1.2,0.03670400083065033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,16,power_law_1.2,0.04008319973945618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,16,power_law_1.2,0.03920640051364899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,16,power_law_1.2,0.040249601006507874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,16,power_law_1.2,0.04242559969425201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,16,power_law_1.2,0.04319359958171844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,16,power_law_1.2,0.04572800099849701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,16,power_law_1.2,0.04682239890098572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,16,power_law_1.2,0.04885759949684143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,16,power_law_1.2,0.05143679976463318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,16,power_law_1.2,0.06338559985160827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,16,power_law_1.2,0.06471040248870849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,16,balanced,0.9490293661753336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,16,power_law_1.2,0.06616320013999939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,16,power_law_1.2,0.08261119723320007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,16,power_law_1.2,0.09037439823150635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,16,power_law_1.2,0.11238399744033814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,16,power_law_1.2,0.13626240491867064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,16,power_law_1.2,0.17420799732208253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,16,power_law_1.2,0.21364479064941405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,16,power_law_1.2,0.28089599609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,16,power_law_1.2,0.3907968044281006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,16,power_law_1.2,0.6090496063232422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,16,power_law_1.2,0.867251205444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,16,power_law_1.2,0.9019071578979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,16,power_law_1.2,1.7179904937744142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,16,power_law_1.2,4.035033416748047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,16,balanced,1.876981258392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,8,balanced,0.0328053335348765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,8,balanced,0.030005333324273426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,16,power_law_1.2,0.03480960130691528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,8,balanced,0.030954666435718536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,16,power_law_1.2,0.028377598524093627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,8,balanced,0.035429333647092186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,16,power_law_1.2,0.028940799832344054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,8,balanced,0.04974933465321859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,16,power_law_1.2,0.03184640109539032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,8,balanced,0.051039998730023704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,8,balanced,0.051914667089780174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,16,power_law_1.2,0.03472639918327332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,8,balanced,0.052613332867622375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,16,power_law_1.2,0.03576320111751556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,8,balanced,0.052341332038243614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,16,power_law_1.2,0.03703039884567261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,8,balanced,0.03297066688537598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,16,power_law_1.2,0.03852159976959228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,8,balanced,0.05306133131186167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,8,balanced,0.03253866732120514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,16,power_law_1.2,0.04239999949932098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,8,balanced,0.05346666773160299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,8,balanced,0.03509333233038584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,16,power_law_1.2,0.043321600556373595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,8,balanced,0.05453333258628845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,8,balanced,0.03766933331886927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,8,balanced,0.05533866584300995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,16,power_law_1.2,0.04493440091609955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,8,balanced,0.04398400088151296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,16,power_law_1.2,0.0469760000705719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,8,balanced,0.05913599828879038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,8,balanced,0.04509866734345754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,16,power_law_1.2,0.049292799830436704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,8,balanced,0.06086933116118113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,8,balanced,0.044768000642458596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,16,power_law_1.2,0.053446400165557864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,8,balanced,0.06047466893990835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,8,balanced,0.045109331607818604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,8,balanced,0.04534933467706045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,8,balanced,0.06404266754786174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,16,power_law_1.2,0.06429439783096313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,8,balanced,0.04651733239491781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,8,balanced,0.07860266665617625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,8,power_law_1.01,0.03688960075378418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,16,power_law_1.2,0.06981120109558106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,8,balanced,0.04660800099372864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,8,balanced,0.07247999807198842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,8,power_law_1.01,0.03763200044631958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,8,balanced,0.0469760000705719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,8,power_law_1.01,0.036339199542999266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,8,balanced,0.047775998711586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,8,balanced,0.08853866656621297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,16,power_law_1.2,0.07194240093231201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,8,power_law_1.01,0.04051199853420258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,8,balanced,0.05073066552480062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,16,power_law_1.2,0.0868607997894287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,8,balanced,0.08685866991678874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,8,balanced,0.028346667687098186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,8,power_law_1.01,0.042310398817062375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,8,balanced,0.053685332338015236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,16,power_law_1.2,0.10724480152130127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,8,power_law_1.01,0.05070719718933105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,8,balanced,0.029781334102153778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,8,power_law_1.01,0.03699840009212494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,8,balanced,0.055439998706181846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,8,balanced,0.03046933313210805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,8,balanced,0.11987732847531636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,8,power_law_1.01,0.050892800092697144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,16,power_law_1.2,0.13815679550170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,8,balanced,0.03323733309904734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,8,power_law_1.01,0.03418880105018616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,8,balanced,0.05778133372465769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,8,balanced,0.03881066789229711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,16,power_law_1.2,0.16499199867248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,8,power_law_1.01,0.051744002103805545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,8,power_law_1.01,0.036652800440788266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,8,balanced,0.07229866584142049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,8,balanced,0.0395359992980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,8,power_law_1.01,0.05628160238265991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,8,balanced,0.041306667029857635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,8,balanced,0.12686399618784586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,8,power_law_1.01,0.03758719861507416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,8,balanced,0.040752001106739044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,16,power_law_1.2,0.27664639949798586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,8,balanced,0.07228266696135204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,8,power_law_1.01,0.05656319856643677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,8,balanced,0.04138666639725367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,8,power_law_1.01,0.03747200071811676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,16,power_law_1.2,0.3190272092819214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,8,balanced,0.04314666489760081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,8,power_law_1.01,0.058182400465011594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,8,balanced,0.08872000376383464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,8,balanced,0.043338666359583534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,8,power_law_1.01,0.04348799884319306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,8,power_law_1.01,0.06047359704971313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,8,balanced,0.045882667104403176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,8,balanced,0.18389334281285605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,16,power_law_1.2,0.531718397140503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,8,power_law_1.01,0.043987199664115906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,8,balanced,0.04801600178082784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,8,power_law_1.01,0.061382400989532473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,8,balanced,0.09457066655158997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,8,balanced,0.04890666902065277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,8,power_law_1.01,0.04560000002384186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,16,power_law_1.2,0.6417280197143554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,8,power_law_1.01,0.06115840077400207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,8,power_law_1.01,0.046265599131584165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,16,power_law_1.2,1.1518464088439941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,8,power_law_1.01,0.06682239770889283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,8,balanced,0.13134933511416116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,8,balanced,0.060965334375699363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,8,power_law_1.01,0.047660800814628604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,16,power_law_1.2,1.4025152206420899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,8,power_law_1.01,0.070796799659729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,8,balanced,0.06037333110968272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,8,balanced,0.21577600638071695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,8,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,8,power_law_1.01,0.0803391993045807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,16,power_law_1.2,1.4900544166564942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,8,balanced,0.15027733643849692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,8,power_law_1.01,0.05206400156021118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,8,power_law_1.01,0.09202560186386108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,16,power_law_1.2,3.948019027709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,8,power_law_1.01,0.0542527973651886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,8,power_law_1.01,0.09393919706344604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,8,balanced,0.06599999964237213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,8,power_law_1.01,0.0531328022480011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,8,power_law_1.01,0.11518720388412476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,16,power_law_1.2,6.1160320281982425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,8,balanced,0.21894933780034384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,8,balanced,0.07758399844169617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,8,power_law_1.01,0.05856000185012818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,8,power_law_1.01,0.12234879732131958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,8,balanced,0.32681065797805786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,8,balanced,0.08131200075149536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,8,power_law_1.01,0.06423680186271667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,8,power_law_1.01,0.1581760048866272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,8,power_law_1.01,0.07342079877853394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,8,power_law_1.01,0.18279039859771729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,8,power_law_1.01,0.08784639835357666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,8,balanced,0.2685866753260295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,8,power_law_1.01,0.2613055944442749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,8,balanced,0.10447466373443604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,8,power_law_1.01,0.09163519740104675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,8,power_law_1.01,0.34179201126098635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,8,balanced,0.11955733100573222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,8,power_law_1.01,0.11139839887619019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,8,power_law_1.01,0.4197375774383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,8,power_law_1.01,0.12451200485229492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,8,power_law_1.01,0.5826943874359131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,8,balanced,0.40858666102091473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,8,power_law_1.01,0.170579195022583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,8,power_law_1.01,0.7980351924896241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,8,balanced,0.40386664867401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,8,power_law_1.01,0.20327680110931395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,8,balanced,0.17669866482416788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,8,power_law_1.01,1.2119104385375976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,8,power_law_1.01,0.28324480056762696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,8,power_law_1.01,0.3894079923629761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,8,power_law_1.01,2.540928077697754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,8,balanced,0.22684800624847412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,8,power_law_1.01,0.6080639839172364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,8,power_law_1.01,0.7266367912292481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,8,power_law_1.01,0.8943743705749512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,8,balanced,0.5128426551818848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,8,balanced,0.4857706626256307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,8,power_law_1.01,1.5589311599731446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,8,balanced,0.329365332921346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,8,power_law_1.01,3.273555374145508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,8,balanced,0.41910401980082196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,8,power_law_1.01,0.0349375993013382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,8,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,8,balanced,0.6339253187179565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,8,power_law_1.01,0.03129599988460541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,8,power_law_1.01,0.0349375993013382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,8,balanced,0.6109280188878378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,8,power_law_1.2,0.03663359880447388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,8,power_law_1.01,0.03749760091304779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,8,power_law_1.2,0.03415040075778961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,8,power_law_1.01,0.04180479943752289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,8,power_law_1.2,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,8,balanced,0.7041172981262207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,8,power_law_1.01,0.04261760115623474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,8,power_law_1.2,0.03946239948272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,8,power_law_1.01,0.044377601146698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,8,power_law_1.2,0.04300160109996796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,8,power_law_1.01,0.045459198951721194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,8,power_law_1.2,0.051583999395370485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,8,power_law_1.01,0.0469760000705719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,8,balanced,0.796837329864502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,8,power_law_1.2,0.05208960175514221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,8,power_law_1.01,0.05056639909744263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,8,power_law_1.2,0.05311999917030334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,8,power_law_1.01,0.05367680191993714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,8,power_law_1.2,0.056505602598190305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,8,power_law_1.01,0.056383997201919556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,8,power_law_1.2,0.057120001316070555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,8,power_law_1.01,0.061260801553726194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,8,balanced,0.9484639962514242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,8,power_law_1.2,0.059910398721694944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,8,power_law_1.01,0.06769279837608337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,8,power_law_1.2,0.05997440218925476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,8,power_law_1.01,0.07797120213508606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,8,power_law_1.2,0.06169599890708923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,8,power_law_1.2,0.06453120112419128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,8,balanced,0.9850560029347738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,8,power_law_1.2,0.0698751986026764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,8,power_law_1.01,0.0824512004852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,8,power_law_1.2,0.07679359912872315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,8,power_law_1.01,0.09405440092086792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,8,power_law_1.2,0.08305919766426087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,8,power_law_1.01,0.11960959434509277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,8,power_law_1.2,0.09882879853248597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,8,power_law_1.2,0.09791359901428223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,8,power_law_1.01,0.15187840461730956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,8,power_law_1.2,0.12253439426422119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,8,power_law_1.01,0.19147520065307616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,8,power_law_1.2,0.13714560270309448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,8,power_law_1.2,0.17745920419692993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,8,power_law_1.01,0.30229759216308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,8,power_law_1.2,0.23777918815612792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,8,power_law_1.01,0.3657855987548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,8,power_law_1.2,0.3158463954925537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,8,power_law_1.2,0.386847996711731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,8,power_law_1.01,0.5208960056304932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,8,power_law_1.2,0.6038015842437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,8,balanced,1.3711466789245605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,8,power_law_1.01,0.6820608139038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,8,balanced,1.556282679239909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,8,power_law_1.2,0.7991807937622071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,8,power_law_1.01,0.9753279685974121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,8,power_law_1.2,0.9828351974487305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,8,power_law_1.01,1.4899392127990723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,8,power_law_1.2,1.621811294555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,8,power_law_1.01,1.6627519607543946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,8,power_law_1.01,2.534048080444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,8,power_law_1.2,4.036671829223633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,8,balanced,1.8613707224527996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,8,power_law_1.01,5.643404769897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,8,power_law_1.2,0.037427198886871335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,8,power_law_1.2,0.032467201352119446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,8,power_law_1.2,0.03470720052719116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,8,balanced,3.0857601165771484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,8,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,8,power_law_1.2,0.03899520039558411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,8,power_law_1.2,0.04407039880752563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,8,power_law_1.2,0.04567680060863495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,8,power_law_1.2,0.04604800045490265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,8,power_law_1.2,0.0473471999168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,8,power_law_1.2,0.04856959879398346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,8,power_law_1.2,0.034944000840187076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,8,power_law_1.2,0.051097601652145386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,8,power_law_1.2,0.03054719865322113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,8,power_law_1.2,0.052799999713897705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,8,power_law_1.2,0.031091201305389404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,8,power_law_1.2,0.05742719769477844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,8,power_law_1.2,0.03535360097885132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,8,power_law_1.2,0.05630080103874206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,4,balanced,0.035274667044480644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,8,power_law_1.2,0.03772160112857818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,8,power_law_1.2,0.06591359972953796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,4,balanced,0.03535466641187668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,8,power_law_1.2,0.06874880194664001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,8,power_law_1.2,0.04167680144309997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,4,balanced,0.04163199911514918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,8,power_law_1.2,0.0438400000333786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,8,power_law_1.2,0.07562239766120911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,4,balanced,0.04243200023969015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,8,power_law_1.2,0.044614401459693906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,8,power_law_1.2,0.08873599767684937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,4,balanced,0.058090666929880776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,8,power_law_1.2,0.09453439712524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,8,power_law_1.2,0.04573439955711365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,4,balanced,0.059205333391825356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,8,power_law_1.2,0.11802239418029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,8,power_law_1.2,0.04759680032730103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,4,balanced,0.05892266829808553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,8,power_law_1.2,0.13791999816894532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,8,power_law_1.2,0.05248640179634094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,4,balanced,0.05945600072542826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,8,power_law_1.2,0.05427839756011963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,8,power_law_1.2,0.1815551996231079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,4,balanced,0.059077332417170204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,8,power_law_1.2,0.22872960567474365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,8,power_law_1.2,0.056480002403259275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,4,balanced,0.05950400233268738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,8,power_law_1.2,0.3485759973526001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,4,balanced,0.059989333152770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,8,power_law_1.2,0.06340479850769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,4,balanced,0.06221333146095276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,8,power_law_1.2,0.4246016025543213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,8,power_law_1.2,0.06907520294189454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,4,balanced,0.06100266675154368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,8,power_law_1.2,0.731763219833374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,8,power_law_1.2,0.07835519909858704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,4,balanced,0.0647680014371872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,8,power_law_1.2,1.0037311553955077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,4,balanced,0.06881066660086314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,8,power_law_1.2,1.148838424682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,4,balanced,0.07008533179759979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,8,power_law_1.2,0.08583040237426758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,8,power_law_1.2,1.774355125427246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,4,balanced,0.07529599964618683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,8,power_law_1.2,0.0986240029335022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,8,power_law_1.2,0.12627840042114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,4,balanced,0.08768533666928609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,8,power_law_1.2,3.8430526733398436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,4,balanced,0.08933867017428081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,8,power_law_1.2,0.16239999532699584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,8,power_law_1.2,0.20683519840240477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,4,balanced,0.1058240036169688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,4,balanced,0.11501333117485046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,8,power_law_1.2,0.29711360931396485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,8,power_law_1.2,0.4078400135040283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,4,balanced,0.15362133582433066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,8,power_law_1.2,0.5864511966705322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,8,power_law_1.2,0.7855807781219483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,4,balanced,0.1872746745745341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,8,power_law_1.2,1.4745216369628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,8,power_law_1.2,1.360262393951416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,8,power_law_1.2,1.9160320281982421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,4,balanced,0.26183466116587323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,8,power_law_1.2,4.01641616821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,8,power_law_1.2,9.347500610351563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,4,balanced,0.03256533294916153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,4,balanced,0.3572160005569458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,4,balanced,0.033039999504884086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,4,balanced,0.03486400097608566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,4,balanced,0.03999999910593033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,4,balanced,0.0490880012512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,4,balanced,0.04986133178075155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,4,balanced,0.5166879892349243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,4,balanced,0.04985066751639048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,4,balanced,0.05020800232887268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,4,balanced,0.05052266518274943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,4,balanced,0.051829333106676735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,4,power_law_1.01,0.03692800104618073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,4,balanced,0.05176533261934916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,4,power_law_1.01,0.03586559891700745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,4,balanced,0.053823997577031456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,4,power_law_1.01,0.04004479944705963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,4,balanced,0.05454400181770325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,4,power_law_1.01,0.033958399295806886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,4,power_law_1.01,0.04437119960784912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,4,balanced,0.673472007115682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,4,balanced,0.058037335673967995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,4,balanced,0.06471466521422069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,4,power_law_1.01,0.04793600142002106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,4,power_law_1.01,0.03464959859848023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,4,power_law_1.01,0.05744640231132507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,4,balanced,0.06433066725730896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,4,power_law_1.01,0.034067198634147644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,4,power_law_1.01,0.03979519903659821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,4,power_law_1.01,0.05809919834136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,4,balanced,0.07331199944019318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,4,power_law_1.01,0.040531200170516965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,4,power_law_1.01,0.059628802537918094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,4,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,4,balanced,0.08301866551240285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,4,power_law_1.01,0.04718720018863678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,4,power_law_1.01,0.060159999132156375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,4,power_law_1.01,0.048895999789237976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,4,balanced,0.08903466661771138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,4,power_law_1.01,0.06193280220031738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,4,power_law_1.01,0.04996480047702789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,4,power_law_1.01,0.05113599896430969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,4,power_law_1.01,0.06259199976921082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,4,balanced,0.10678399602572124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,4,power_law_1.01,0.055027198791503903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,4,power_law_1.01,0.06494719982147217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,4,power_law_1.01,0.057107198238372806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,4,balanced,0.8322986761728922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,4,power_law_1.01,0.06812160015106201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,4,power_law_1.01,0.06158080101013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,4,balanced,0.12220799922943115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,4,power_law_1.01,0.0636352002620697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,4,power_law_1.01,0.0690496027469635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,4,power_law_1.01,0.07025920152664185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,4,power_law_1.01,0.07639679908752442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,4,power_law_1.01,0.07789440155029297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,4,balanced,0.17108267545700073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,4,power_law_1.01,0.0806335985660553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,4,power_law_1.01,0.08217599987983704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,4,power_law_1.01,0.09937279820442199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,4,power_law_1.01,0.08597760200500489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,4,power_law_1.01,0.1074944019317627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,4,power_law_1.01,0.10757759809494019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,4,balanced,0.2042400042215983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,4,power_law_1.01,0.13233280181884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,4,power_law_1.01,0.10942720174789429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,4,power_law_1.01,0.15627520084381102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,4,power_law_1.01,0.13216639757156373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,4,power_law_1.01,0.202508807182312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,4,power_law_1.01,0.15217280387878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,4,power_law_1.01,0.26150400638580323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,4,power_law_1.01,0.2048192024230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,4,power_law_1.01,0.36366078853607176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,4,balanced,0.30243200063705444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,4,power_law_1.01,0.48382081985473635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,4,power_law_1.01,0.23349759578704835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,4,power_law_1.01,0.7341631889343262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,4,power_law_1.01,0.34666879177093507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,4,power_law_1.01,0.9647551536560058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,4,power_law_1.01,0.4228544235229492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,4,power_law_1.01,1.0584128379821778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,4,power_law_1.01,0.5776447772979736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,4,balanced,0.40968000888824463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,4,balanced,1.1966933409372966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,4,power_law_1.01,1.8070144653320312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,4,power_law_1.01,0.8067584037780762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,4,power_law_1.01,1.0811391830444337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,4,power_law_1.01,3.6000640869140623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,4,power_law_1.01,1.5988096237182616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,4,power_law_1.01,3.381779098510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,4,balanced,0.6039520104726156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,4,balanced,0.7391680081685384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,4,power_law_1.2,0.037062400579452516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,4,balanced,0.9414666493733724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,4,power_law_1.2,0.03648639917373657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,4,power_law_1.2,0.03814400136470795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,4,power_law_1.2,0.04246399998664856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,4,balanced,2.323808034261068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,4,power_law_1.2,0.04482559859752655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,4,power_law_1.2,0.05666559934616089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,4,power_law_1.2,0.0587007999420166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,4,power_law_1.2,0.0598143994808197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,4,power_law_1.2,0.06080639958381653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,4,power_law_1.2,0.06085119843482971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,4,power_law_1.2,0.06289280056953431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,4,power_law_1.2,0.06578559875488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,4,balanced,1.4471093813578289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,4,power_law_1.2,0.06914560198783874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,4,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,4,power_law_1.2,0.07061120271682739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,4,power_law_1.2,0.035078400373458864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,4,power_law_1.2,0.0787392020225525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,4,power_law_1.2,0.03451519906520843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,4,power_law_1.2,0.08223360180854797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,4,power_law_1.2,0.03818239867687225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,4,power_law_1.2,0.04216960072517395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,4,power_law_1.2,0.0906112015247345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,4,power_law_1.2,0.04895359873771667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,4,power_law_1.2,0.11383039951324463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,4,power_law_1.2,0.05015680193901062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,4,power_law_1.2,0.12165759801864624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,4,power_law_1.2,0.05050879716873169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,4,power_law_1.2,0.1445248007774353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,4,power_law_1.2,0.052960002422332765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,4,power_law_1.2,0.15670399665832518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,4,power_law_1.2,0.0531391978263855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,4,power_law_1.2,0.23580799102783204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,4,power_law_1.2,0.057529598474502563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,4,power_law_1.2,0.3004544019699097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,4,power_law_1.2,0.06088320016860962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,4,power_law_1.2,0.06305279731750488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,4,power_law_1.2,0.3995840072631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,4,power_law_1.2,0.06369919776916504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,4,power_law_1.2,0.48901758193969724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,4,power_law_1.2,0.07204480171203613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,4,power_law_1.2,0.6288959980010986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,4,power_law_1.2,0.08008319735527039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,4,power_law_1.2,0.09032319784164429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,4,power_law_1.2,0.9171327590942383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,4,power_law_1.2,0.10117119550704956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,4,power_law_1.2,1.243391990661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,4,power_law_1.2,0.11192959547042847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,4,power_law_1.2,0.14251519441604615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,4,power_law_1.2,2.1840768814086915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,4,power_law_1.2,0.16427520513534546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,4,power_law_1.2,0.21742720603942872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,4,power_law_1.2,4.13966064453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,4,power_law_1.2,0.2717695951461792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,4,power_law_1.2,0.413043212890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,4,power_law_1.2,0.5393152236938477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,4,power_law_1.2,0.8934207916259765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,4,balanced,2.884906768798828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,4,power_law_1.2,1.0054911613464355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,4,power_law_1.2,1.3508031845092774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,4,power_law_1.2,2.2741119384765627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,4,power_law_1.2,4.773215866088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,2,balanced,0.03696533292531967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,2,balanced,0.03787733366092046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,2,balanced,0.042122667034467064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,2,balanced,0.05008000135421753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,2,balanced,0.06859200199445088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,2,balanced,0.07025066514809926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,2,balanced,0.07072533170382182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,2,balanced,0.07172800103823344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,2,balanced,0.03496533383925756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,2,balanced,0.0720000018676122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,2,balanced,0.03573333223660787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,2,balanced,0.0728959987560908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,2,balanced,0.0415040006240209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,2,balanced,0.07427200178305308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,2,balanced,0.07558933397134145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,2,balanced,0.04868799944718679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,2,balanced,0.07768533130486806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,2,balanced,0.06409066418806712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,2,balanced,0.06367999811967213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,2,balanced,0.07944533228874207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,2,balanced,0.06491200129191081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,2,balanced,0.08318399886290233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,2,balanced,0.06436266501744588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,2,balanced,0.08553066849708557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,2,balanced,0.06586133440335591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,2,balanced,0.09873066345850627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,2,balanced,0.06677866478761037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,2,balanced,0.10960533221562703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,2,balanced,0.06621866424878438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,2,balanced,0.12771733601888022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,2,balanced,0.07026133437951405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,2,balanced,0.07150400181611379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,2,balanced,0.15082666277885437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,2,balanced,0.07613866527875264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,2,balanced,0.17202132940292358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,2,balanced,0.08346666892369588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,2,balanced,0.08711999654769897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,2,balanced,0.23829867442448935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,2,balanced,0.10136000315348308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,2,balanced,0.11130133271217346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,2,balanced,0.28116265932718915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,2,balanced,0.1262986660003662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,2,power_law_1.01,0.03627519905567169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,2,balanced,0.1516266663869222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,2,power_law_1.01,0.03651840090751648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,2,power_law_1.01,0.03992320001125336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,2,balanced,0.4532693227132161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,2,power_law_1.01,0.049081599712371825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,2,balanced,0.18004266421000162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,2,power_law_1.01,0.053651201725006106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,2,power_law_1.01,0.06673280000686646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,2,balanced,0.2597973346710205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,2,power_law_1.01,0.06869760155677795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,2,balanced,0.590831995010376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,2,power_law_1.01,0.07078400254249573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,2,power_law_1.01,0.06976640224456787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,2,balanced,0.31813865900039673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,2,power_law_1.01,0.07192959785461425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,2,power_law_1.01,0.07433599829673768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,2,power_law_1.01,0.07707520127296448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,2,power_law_1.01,0.07948799729347229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,2,balanced,0.4646559953689575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,2,power_law_1.01,0.08184959888458251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,2,balanced,0.8862079779307047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,2,power_law_1.01,0.09244160056114196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,2,power_law_1.01,0.09957119822502136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,2,power_law_1.01,0.10423040390014648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,2,power_law_1.01,0.12983039617538453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,2,power_law_1.01,0.14539519548416138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,2,balanced,0.6602773269017538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,2,power_law_1.01,0.17142399549484252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,2,power_law_1.01,0.20638720989227294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,2,power_law_1.01,0.30202879905700686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,2,power_law_1.01,0.3314239978790283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,2,balanced,1.110858678817749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,2,power_law_1.01,0.47032318115234373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,2,power_law_1.01,0.6172095775604248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,2,balanced,1.000106652577718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,2,power_law_1.01,0.9262784004211426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,2,power_law_1.01,1.1897919654846192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,2,power_law_1.01,1.5059391975402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,2,power_law_1.01,2.504287910461426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,2,power_law_1.01,5.0033214569091795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,2,balanced,1.3964373270670574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,2,power_law_1.01,0.03492479920387268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,2,balanced,1.2469013532002766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,2,power_law_1.01,0.035366401076316833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,2,power_law_1.01,0.03766399919986725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,2,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,2,power_law_1.01,0.04996480047702789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,2,power_law_1.01,0.05868160128593445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,2,power_law_1.01,0.06083199977874756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,2,power_law_1.01,0.061292797327041626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,2,power_law_1.01,0.06421120166778564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,2,power_law_1.2,0.036313599348068236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,2,balanced,1.5800800323486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,2,power_law_1.01,0.0661952018737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,2,power_law_1.2,0.03676159977912903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,2,power_law_1.01,0.06907520294189454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,2,power_law_1.01,0.07498239874839782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,2,power_law_1.2,0.04071680009365082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,2,power_law_1.01,0.08042880296707153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,2,power_law_1.2,0.04732159972190857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,2,power_law_1.01,0.0819711983203888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,2,power_law_1.2,0.05307520031929016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,2,power_law_1.01,0.09208319783210754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,2,balanced,2.1620799700419107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,2,power_law_1.2,0.06743040084838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,2,power_law_1.01,0.1044160008430481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,2,power_law_1.2,0.06862080097198486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,2,power_law_1.01,0.10603519678115844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,2,power_law_1.2,0.07059839963912964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,2,power_law_1.01,0.1293951988220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,2,power_law_1.2,0.07264639735221863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,2,power_law_1.01,0.14485759735107423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,2,power_law_1.2,0.07303680181503296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,2,power_law_1.01,0.18008320331573485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,2,power_law_1.2,0.07542399764060974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,2,power_law_1.01,0.21214079856872559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,2,power_law_1.01,0.3055232048034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,2,power_law_1.2,0.08090239763259888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,2,power_law_1.01,0.36046719551086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,2,power_law_1.2,0.08036479949951172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,2,power_law_1.2,0.03460479974746704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,2,balanced,2.4800853729248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,2,power_law_1.01,0.5101183891296387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,2,power_law_1.2,0.08349440097808838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,2,power_law_1.2,0.09597439765930176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,2,power_law_1.01,0.6729536056518555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,2,power_law_1.2,0.03523840010166168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,2,power_law_1.2,0.10272639989852905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,2,power_law_1.01,1.0130623817443847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,2,power_law_1.2,0.037510401010513304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,2,power_law_1.2,0.04178560078144074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,2,power_law_1.2,0.10611840486526489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,2,power_law_1.01,1.3217151641845704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,2,power_law_1.2,0.047065600752830505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,2,power_law_1.2,0.1402176022529602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,2,power_law_1.01,1.7873727798461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,2,power_law_1.2,0.05907840132713318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,2,power_law_1.2,0.1443519949913025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,2,power_law_1.01,2.71278076171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,2,power_law_1.2,0.06060799956321716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,2,power_law_1.2,0.18974080085754394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,2,power_law_1.2,0.06438400149345398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,2,power_law_1.2,0.20906879901885986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,2,power_law_1.01,5.834643173217773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,2,power_law_1.2,0.06542080044746398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,2,power_law_1.2,0.31233279705047606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,2,power_law_1.2,0.06673280000686646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,2,power_law_1.2,0.36878080368041993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,2,power_law_1.2,0.07216640114784241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,2,power_law_1.2,0.4942016124725342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,2,power_law_1.2,0.07598080039024353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,2,power_law_1.2,0.6774464130401612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,2,power_law_1.2,0.08265600204467774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,2,power_law_1.2,0.9564160346984864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,2,power_law_1.2,0.08314239978790283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,2,power_law_1.2,1.2541760444641112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,2,power_law_1.2,0.0987712025642395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,2,power_law_1.2,0.10337280035018921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,2,power_law_1.2,1.7329792022705077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,2,balanced,4.319952011108398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,2,power_law_1.2,0.1098431944847107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,2,power_law_1.2,2.708294486999512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,2,power_law_1.2,0.13352320194244385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,2,power_law_1.2,0.14249600172042848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,2,power_law_1.2,5.7816001892089846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,2,power_law_1.2,0.19040640592575073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,2,power_law_1.2,0.219596791267395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,2,power_law_1.2,0.32705280780792234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,2,power_law_1.2,0.3944000005722046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,2,balanced,4.955178578694661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,2,power_law_1.2,0.5577983856201172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,2,power_law_1.2,0.7374015808105469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,2,power_law_1.2,1.1043392181396485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,2,power_law_1.2,1.5857151985168456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,2,power_law_1.2,1.9850175857543946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,2,power_law_1.2,3.3385215759277345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,2,power_law_1.2,6.661081695556641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,32,balanced,0.06506666541099548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,32,balanced,0.06173333525657654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,32,balanced,0.05625600119431814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,32,balanced,0.06775466601053874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,32,balanced,0.08999466896057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,32,balanced,0.10181333621342976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,32,balanced,0.10131200154622395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,32,balanced,0.10400000214576721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,32,balanced,0.10309333602587382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,32,balanced,0.10362133383750916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,32,balanced,0.10414933164914449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,32,balanced,0.10481066505114238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,32,balanced,0.10552000006039937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,32,balanced,0.10886399944623311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,32,balanced,0.11194133758544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,32,balanced,0.11343466242154439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,32,balanced,0.11621866623560588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,32,balanced,0.12129599849383037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,32,balanced,0.12566933035850525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,32,balanced,0.15732799967130026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,32,balanced,0.14658666650454202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,32,balanced,0.0499946673711141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,32,balanced,0.22137600183486938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,32,balanced,0.05221866567929586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,32,balanced,0.0488373339176178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,32,balanced,0.057349334160486855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,32,balanced,0.20093866189320883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,32,balanced,0.07216533521811168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,32,balanced,0.07737599809964497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,32,balanced,0.07867200175921123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,32,balanced,0.07895466685295105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,32,balanced,0.3114560047785441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,32,balanced,0.07938133180141449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,32,balanced,0.08019199967384338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,32,balanced,0.08253333469231923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,32,balanced,0.08258133133252461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,32,balanced,0.08335999647776286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,32,balanced,0.08567466338475545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,32,balanced,0.34147198994954425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,32,balanced,0.09052800138791402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,32,balanced,0.09238400061925252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,32,balanced,0.042394667863845825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,32,balanced,0.09500267108281453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,32,balanced,0.04313066601753235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,32,balanced,0.10421866178512573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,32,balanced,0.04301333427429199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,32,balanced,0.11098133524258931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,32,balanced,0.05390933156013489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,32,balanced,0.06586133440335591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,32,balanced,0.48188801606496173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,32,balanced,0.14217066764831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,32,balanced,0.07205866773923238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,32,balanced,0.07292266686757405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,32,balanced,0.14452800154685974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,32,balanced,0.0735093355178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,32,balanced,0.07397866745789845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,32,balanced,0.07457066575686137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,32,balanced,0.19777067502339682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,32,balanced,0.07619200150171916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,32,balanced,0.07552533348401387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,32,power_law_1.01,0.10116480588912964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,32,power_law_1.01,0.07155839800834655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,32,balanced,0.07791999975840251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,32,balanced,0.21549334128697714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,32,power_law_1.01,0.09264640212059021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,32,balanced,0.5645440022150675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,32,power_law_1.01,0.0680512011051178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,32,balanced,0.07858666777610779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,32,power_law_1.01,0.06802560091018676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,32,power_law_1.01,0.05116159915924072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,32,balanced,0.08367466926574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,32,power_law_1.01,0.06455039978027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,32,power_law_1.01,0.08179839849472045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,32,balanced,0.3155893286069234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,32,power_law_1.01,0.06734079718589783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,32,power_law_1.01,0.0874239981174469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,32,power_law_1.01,0.0717631995677948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,32,power_law_1.01,0.0978879988193512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,32,power_law_1.01,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,32,balanced,0.08507733543713887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,32,power_law_1.01,0.0967296004295349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,32,power_law_1.01,0.07668480277061462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,32,balanced,0.3729013204574585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,32,power_law_1.01,0.09763839840888977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,32,power_law_1.01,0.07089920043945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,32,power_law_1.01,0.07767040133476258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,32,power_law_1.01,0.09956480264663696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,32,power_law_1.01,0.06737279891967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,32,power_law_1.01,0.07998719811439514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,32,balanced,0.6902613639831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,32,power_law_1.01,0.09909120202064514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,32,power_law_1.01,0.08234879970550538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,32,power_law_1.01,0.04842880070209503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,32,power_law_1.01,0.10858240127563476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,32,power_law_1.2,0.09499520063400269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,32,balanced,0.08965866764386494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,32,power_law_1.01,0.0825984001159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,32,power_law_1.01,0.059648001194000246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,32,power_law_1.01,0.11391359567642212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,32,power_law_1.2,0.06982399821281433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,32,balanced,0.5359733502070109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,32,power_law_1.01,0.08836479783058167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,32,power_law_1.01,0.06155520081520081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,32,power_law_1.2,0.07264639735221863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,32,power_law_1.01,0.11419520378112794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,32,power_law_1.01,0.06939520239830017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,32,power_law_1.01,0.0908735990524292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,32,power_law_1.2,0.08246399760246277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,32,power_law_1.01,0.1168063998222351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,32,power_law_1.01,0.07282559871673584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,32,power_law_1.01,0.09757440090179444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,32,power_law_1.2,0.08047360181808472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,32,power_law_1.01,0.1298367977142334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,32,power_law_1.01,0.07525759935379028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,32,power_law_1.01,0.10166399478912354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,32,power_law_1.2,0.06965759992599488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,32,power_law_1.2,0.09991679787635803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,32,power_law_1.01,0.13468799591064454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,32,power_law_1.01,0.10257920026779174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,32,power_law_1.2,0.09813119769096375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,32,power_law_1.01,0.07652480006217957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,32,power_law_1.2,0.05801600217819214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,32,balanced,0.09839466214179993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,32,power_law_1.01,0.13434239625930786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,32,power_law_1.2,0.055078399181365964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,32,power_law_1.2,0.0961023986339569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,32,power_law_1.01,0.12837120294570922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,32,power_law_1.01,0.07437440156936645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,32,power_law_1.01,0.1586176037788391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,32,power_law_1.2,0.05910400152206421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,32,balanced,0.10512533783912659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,32,balanced,0.660810669263204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,32,power_law_1.2,0.10589439868927002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,32,power_law_1.01,0.14561920166015624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,32,power_law_1.01,0.08558080196380616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,32,power_law_1.2,0.06736000180244446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,32,power_law_1.01,0.1803712010383606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,32,power_law_1.2,0.07585279941558838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,32,power_law_1.2,0.10550400018692016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,32,power_law_1.01,0.17960959672927856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,32,power_law_1.01,0.08989440202713013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,32,power_law_1.2,0.07589120268821717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,32,power_law_1.01,0.220198392868042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,32,power_law_1.2,0.11123839616775513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,32,power_law_1.01,0.20409600734710692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,32,power_law_1.01,0.09049599766731262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,32,power_law_1.2,0.0789247989654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,32,power_law_1.01,0.24866559505462646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,32,power_law_1.2,0.08078719973564148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,32,power_law_1.2,0.11749759912490845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,32,balanced,0.9940533638000488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,32,power_law_1.01,0.25832319259643555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,32,power_law_1.01,0.0927295982837677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,32,power_law_1.2,0.08134400248527526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,32,power_law_1.01,0.32413439750671386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,32,power_law_1.2,0.11845120191574096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,32,power_law_1.01,0.33851521015167235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,32,power_law_1.2,0.08208640217781067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,32,power_law_1.01,0.11051520109176635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,32,power_law_1.01,0.40297598838806153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,32,power_law_1.2,0.08881279826164246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,32,power_law_1.2,0.1244928002357483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,32,power_law_1.01,0.4169663906097412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,32,power_law_1.2,0.09208319783210754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,32,balanced,0.12290666500727336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,32,power_law_1.01,0.5325632095336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,32,power_law_1.2,0.13035520315170288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,32,power_law_1.2,0.09546239972114563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,32,power_law_1.01,0.5554880142211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,32,power_law_1.01,0.10780160427093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,32,power_law_1.2,0.14010239839553834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,32,power_law_1.2,0.10026240348815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,32,power_law_1.01,0.6717184066772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,32,balanced,0.8173920313517252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,32,balanced,0.1368053356806437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,32,power_law_1.2,0.10901119709014892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,32,power_law_1.01,0.8044159889221192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,32,power_law_1.2,0.14026880264282227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,32,power_law_1.2,0.11255040168762206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,32,power_law_1.01,0.9888383865356445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,32,power_law_1.2,0.16881279945373534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,32,power_law_1.01,1.0190976142883301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,32,power_law_1.2,0.13766399621963502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,32,power_law_1.01,0.11484160423278808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,32,power_law_1.01,1.2212224006652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,32,power_law_1.2,0.15616639852523803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,32,balanced,0.18533867597579956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,32,power_law_1.2,0.20505599975585936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,32,power_law_1.01,1.341651153564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,32,power_law_1.2,0.20613760948181153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,32,power_law_1.2,0.24598400592803954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,32,power_law_1.01,1.4650303840637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,32,power_law_1.2,0.22440319061279296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,32,power_law_1.01,2.0207103729248046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,32,power_law_1.2,0.30113279819488525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,32,power_law_1.2,0.3189568042755127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,32,power_law_1.01,0.14050559997558593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,32,balanced,0.2118133306503296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,32,power_law_1.01,2.4144256591796873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,32,power_law_1.2,0.40405759811401365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,32,power_law_1.2,0.33471360206604006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,32,power_law_1.2,0.5796607971191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,32,power_law_1.01,0.15882879495620728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,32,power_law_1.01,4.225523376464844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,32,power_law_1.2,0.5172544002532959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,32,power_law_1.2,0.7249599933624268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,32,power_law_1.01,6.3444160461425785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,32,power_law_1.2,0.7385216236114502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,32,power_law_1.2,1.101574420928955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,32,balanced,0.29261332750320435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,32,power_law_1.2,1.9208192825317383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,32,power_law_1.01,0.20060160160064697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,32,power_law_1.2,0.867955207824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,32,power_law_1.2,1.962067222595215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,32,power_law_1.01,0.22147200107574463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,32,power_law_1.2,1.4779199600219726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,32,power_law_1.2,3.599507141113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,32,power_law_1.01,0.34145278930664064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,32,power_law_1.2,1.8350400924682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,32,balanced,0.38175467650095624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,32,power_law_1.2,7.5948738098144535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,32,balanced,1.2158133188883464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,32,power_law_1.01,0.4818431854248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,32,power_law_1.2,2.232249641418457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,32,power_law_1.01,0.6220096111297607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,32,power_law_1.2,4.158323287963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,32,power_law_1.01,0.7802879810333252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,32,power_law_1.01,1.2368255615234376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,32,power_law_1.2,10.735609436035157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,32,balanced,0.5319146712621053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,32,power_law_1.01,1.547916793823242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,32,balanced,2.045957406361898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,32,power_law_1.01,2.2040767669677734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,32,power_law_1.01,2.883296012878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,32,balanced,0.6998613675435384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,32,power_law_1.01,6.890720367431641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,32,balanced,0.8381973107655843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,32,balanced,2.397285302480062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,32,balanced,1.3209546407063801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,32,balanced,2.6487040519714355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,16,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,16,balanced,0.04641599953174591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,16,balanced,0.05213333169619242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,32,power_law_1.2,0.07109119892120361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,16,balanced,0.04785599807898203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,16,balanced,0.05588266750176748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,32,power_law_1.2,0.05457280278205871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,16,balanced,0.06651733318964641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,16,balanced,0.051072001457214355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,16,balanced,0.09041600426038106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,16,balanced,0.05762666463851929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,32,power_law_1.2,0.048614400625228885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,16,balanced,0.10046399633089702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,16,balanced,0.06864533325036366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,32,power_law_1.2,0.06037120223045349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,16,balanced,0.10180266698201497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,16,balanced,0.07728533446788788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,32,power_law_1.2,0.06269440054893494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,16,balanced,0.10331199566523235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,16,balanced,0.07849066456158955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,16,balanced,0.10319999853769939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,32,power_law_1.2,0.07251840233802795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,16,balanced,0.10348266363143921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,16,balanced,0.07918400069077809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,32,power_law_1.2,0.07023360133171082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,16,balanced,0.10611733794212341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,16,balanced,0.0795413355032603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,32,power_law_1.2,0.07386239767074584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,16,balanced,0.10698133707046509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,16,balanced,0.08078933258851369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,32,power_law_1.2,0.07507839798927307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,16,balanced,0.10745066404342651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,16,power_law_1.01,0.09240959882736206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,16,balanced,0.04205866654713949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,16,balanced,0.08145066599051158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,32,power_law_1.2,0.0840511977672577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,16,balanced,0.10781866312026978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,16,balanced,0.08233066896597545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,16,power_law_1.01,0.08609920144081115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,16,balanced,0.043103997906049095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,32,power_law_1.2,0.08712319731712341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,16,balanced,0.11165866255760193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,16,balanced,0.08404800295829773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,16,balanced,0.04340266684691111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,16,power_law_1.01,0.062028801441192626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,32,power_law_1.2,0.08986240029335021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,16,balanced,0.12152000268300374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,16,balanced,0.05531733234723409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,16,balanced,0.08578133583068848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,16,power_law_1.01,0.07096319794654846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,16,balanced,0.06759466727574666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,32,power_law_1.2,0.09701120257377624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,16,balanced,0.11528533697128296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,16,balanced,0.09063466389973958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,16,power_law_1.01,0.08098559975624084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,16,balanced,0.07376533250013988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,32,power_law_1.2,0.09943040013313294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,16,balanced,0.09819199641545613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,16,balanced,0.13261866569519043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,16,power_law_1.01,0.095551997423172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,16,balanced,0.07521600027879079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,16,power_law_1.01,0.07541120052337646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,32,power_law_1.2,0.1248128056526184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,16,balanced,0.09679999947547913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,16,balanced,0.1320799986521403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,16,power_law_1.01,0.09685760140419006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,16,balanced,0.07589866717656453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,16,power_law_1.01,0.06945919990539551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,16,balanced,0.11889599760373433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,16,balanced,0.07639466722806294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,16,power_law_1.01,0.05383679866790771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,16,power_law_1.01,0.09871360063552856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,16,balanced,0.1686826745669047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,16,power_law_1.01,0.05948160290718078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,32,power_law_1.2,0.1142848014831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,16,balanced,0.07746666669845581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,16,balanced,0.1167626678943634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,16,power_law_1.01,0.09678720235824585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,16,power_law_1.01,0.06499199867248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,16,balanced,0.1562986671924591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,16,balanced,0.07831466694672902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,16,power_law_1.01,0.10083199739456176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,16,power_law_1.01,0.07308800220489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,16,balanced,0.15094400445620218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,16,power_law_1.01,0.07348480224609374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,16,balanced,0.07884799937407176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,16,power_law_1.01,0.11338239908218384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,32,power_law_1.2,0.12764159440994263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,16,power_law_1.01,0.07699840068817139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,16,balanced,0.21815999348958334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,16,balanced,0.08061866462230682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,16,balanced,0.15379732847213745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,16,power_law_1.01,0.0771776020526886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,16,power_law_1.01,0.11299200057983398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,16,power_law_1.01,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,16,balanced,0.0822026679913203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,16,power_law_1.01,0.11366399526596069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,16,power_law_1.01,0.08098559975624084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,32,power_law_1.2,0.14542720317840577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,16,balanced,0.08747733632723491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,16,balanced,0.21941866477330527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,16,balanced,0.2201706568400065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,16,power_law_1.01,0.12324479818344117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,16,power_law_1.01,0.08364800214767457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,16,power_law_1.01,0.06592640280723572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,32,power_law_1.2,0.18880640268325805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,16,power_law_1.01,0.08583679795265198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,16,power_law_1.01,0.13365119695663452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,16,power_law_1.01,0.09395840167999267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,16,power_law_1.01,0.06899840235710145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,16,power_law_1.01,0.15109119415283204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,16,power_law_1.01,0.10154240131378174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,16,balanced,0.2322453260421753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,16,balanced,0.3442399899164836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,16,power_law_1.01,0.04798719882965088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,16,power_law_1.01,0.11032960414886475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,16,power_law_1.01,0.1377344012260437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,32,power_law_1.2,0.24760959148406983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,16,balanced,0.0902400016784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,16,power_law_1.01,0.10984959602355956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,16,power_law_1.01,0.05847679972648621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,16,power_law_1.01,0.16158080101013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,32,power_law_1.2,0.3638079881668091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,16,power_law_1.01,0.13760639429092408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,16,power_law_1.01,0.0627839982509613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,16,power_law_1.01,0.1393728017807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,16,power_law_1.01,0.16650880575180055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,16,balanced,0.34411199887593585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,32,power_law_1.2,0.43627519607543946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,16,power_law_1.01,0.17295360565185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,16,power_law_1.01,0.06865919828414917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,16,power_law_1.01,0.21768319606781006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,32,power_law_1.2,0.6238016128540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,16,balanced,0.38116268316904706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,16,power_law_1.01,0.19980159997940064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,16,power_law_1.01,0.07374719977378845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,16,power_law_1.01,0.22663040161132814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,32,power_law_1.2,0.8997056007385253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,16,power_law_1.01,0.25961599349975584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,16,balanced,0.09586133559544881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,16,power_law_1.01,0.0754368007183075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,16,power_law_1.01,0.34425599575042726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,16,power_law_1.01,0.27998719215393064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,32,power_law_1.2,1.099289608001709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,16,power_law_1.01,0.07525119781494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,16,balanced,0.40640532970428467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,16,power_law_1.01,0.4535232067108154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,16,power_law_1.01,0.35961599349975587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,32,power_law_1.2,1.7404735565185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,16,power_law_1.01,0.0818880021572113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,16,power_law_1.01,0.5930624008178711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,16,power_law_1.01,0.455840015411377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,16,power_law_1.01,0.08037760257720947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,16,power_law_1.01,0.8486783981323243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,16,power_law_1.01,0.5299327850341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,16,balanced,0.5329813162485758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,16,power_law_1.01,0.09004799723625183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,16,power_law_1.01,1.0305472373962403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,32,power_law_1.2,2.236288070678711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,16,power_law_1.01,0.8658432006835938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,16,power_law_1.01,1.2520319938659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,16,power_law_1.01,0.09275519847869873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,16,power_law_1.01,0.10089600086212158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,16,power_law_1.01,2.2672319412231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,32,power_law_1.2,3.1494783401489257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,16,power_law_1.01,1.0635647773742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,16,balanced,0.10777599612871806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,16,balanced,0.6064960161844889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,16,power_law_1.01,0.11132160425186158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,16,power_law_1.01,4.237849426269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,16,power_law_1.01,1.262617588043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,32,power_law_1.2,5.272614288330078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,16,balanced,0.11926933129628499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,16,power_law_1.01,2.096134376525879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,16,power_law_1.01,0.11099519729614257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,32,power_law_1.2,12.789132690429687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,16,balanced,0.6259573300679525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,16,power_law_1.01,4.2355712890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,16,power_law_1.01,0.11528960466384888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,16,balanced,0.7094613711039225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,16,balanced,0.14221333463986716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,16,power_law_1.01,0.14687360525131227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,16,power_law_1.01,0.16813440322875978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,16,balanced,0.15946132938067117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,16,balanced,0.22012799978256226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,16,power_law_1.01,0.18979840278625487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,16,balanced,0.7829919656117758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,16,power_law_1.01,0.2647104024887085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,16,balanced,0.26915733019510907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,16,power_law_1.01,0.3486720085144043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,16,balanced,0.8721226851145426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,16,power_law_1.01,0.522156810760498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,16,power_law_1.01,0.7387263774871826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,16,balanced,0.3914719820022583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,16,power_law_1.2,0.09264640212059021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,16,power_law_1.01,0.8802047729492187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,16,power_law_1.2,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,16,power_law_1.01,1.20382719039917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,16,power_law_1.2,0.05983359813690185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,16,power_law_1.2,0.06689919829368592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,16,balanced,0.5037813186645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,16,power_law_1.2,0.07705600261688232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,16,power_law_1.01,1.7020288467407227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,16,power_law_1.2,0.09119359850883484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,16,power_law_1.2,0.0936959981918335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,16,power_law_1.01,2.0781248092651365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,16,power_law_1.2,0.0967423975467682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,16,power_law_1.01,3.1163007736206056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,16,balanced,1.1278186639149983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,16,power_law_1.2,0.10340479612350464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,16,balanced,0.6998826662699381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,16,power_law_1.2,0.10024319887161255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,16,power_law_1.01,7.338502502441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,16,power_law_1.2,0.1108672022819519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,16,balanced,1.3257919947306316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,16,power_law_1.2,0.11382399797439575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,16,power_law_1.2,0.11259520053863525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,16,power_law_1.2,0.12511999607086183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,16,power_law_1.2,0.13490560054779052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,16,power_law_1.2,0.15831680297851564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,16,balanced,0.919648011525472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,16,power_law_1.2,0.15382399559020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,16,power_law_1.2,0.16743680238723754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,16,power_law_1.2,0.18369280099868773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,16,power_law_1.2,0.25058560371398925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,16,power_law_1.2,0.24206080436706542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,16,power_law_1.2,0.347763204574585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,16,power_law_1.2,0.46085119247436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,16,power_law_1.2,0.5960192203521728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,16,balanced,1.1176213423411052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,16,power_law_1.2,0.6687424182891846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,16,power_law_1.2,1.14650239944458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,16,power_law_1.2,1.0568384170532226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,16,power_law_1.2,1.8076864242553712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,16,power_law_1.2,3.0745471954345702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,16,balanced,2.2223199208577475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,16,power_law_1.2,6.840275573730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,16,balanced,2.6245919863382974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,16,balanced,1.7536800702412922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,16,power_law_1.2,0.07517439723014832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,16,power_law_1.2,0.052851200103759766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,16,power_law_1.2,0.053235197067260744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,16,power_law_1.2,0.06778240203857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,16,power_law_1.2,0.05766400098800659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,16,power_law_1.2,0.059564799070358276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,16,power_law_1.2,0.049209600687026976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,16,power_law_1.2,0.07158399820327759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,16,power_law_1.2,0.047443199157714847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,8,balanced,0.052832002441088356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,16,balanced,3.497935930887858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,16,power_law_1.2,0.0732096016407013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,16,power_law_1.2,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,8,balanced,0.05225066840648651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,16,power_law_1.2,0.07661439776420594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,16,power_law_1.2,0.06253439784049988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,8,balanced,0.05690666536490122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,16,power_law_1.2,0.07654399871826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,16,power_law_1.2,0.06947839856147767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,8,balanced,0.07256000240643819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,16,power_law_1.2,0.07964159846305847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,16,power_law_1.2,0.07322880029678344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,8,balanced,0.09066133697827657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,16,power_law_1.2,0.08140799999237061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,8,balanced,0.10356799761454265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,16,power_law_1.2,0.07716479897499084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,16,power_law_1.2,0.08350080251693726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,8,balanced,0.10517866412798564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,16,power_law_1.2,0.07724800109863281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,16,power_law_1.2,0.08592000007629394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,8,balanced,0.10443733135859172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,16,power_law_1.2,0.07752320170402527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,16,power_law_1.2,0.0957759976387024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,8,balanced,0.10470933715502422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,16,power_law_1.2,0.08492799997329711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,16,power_law_1.2,0.10618239641189575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,8,balanced,0.10612799723943074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,16,power_law_1.2,0.0915008008480072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,16,power_law_1.2,0.11885440349578857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,8,balanced,0.10634133219718933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,16,power_law_1.2,0.0969215989112854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,16,power_law_1.2,0.11690239906311035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,8,balanced,0.109333336353302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,16,power_law_1.2,0.09863680005073547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,16,power_law_1.2,0.1398144006729126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,8,balanced,0.1085599958896637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,16,power_law_1.2,0.12574080228805543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,16,power_law_1.2,0.15104000568389891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,8,balanced,0.1149120032787323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,8,balanced,0.11760000387827556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,16,power_law_1.2,0.1871616005897522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,8,balanced,0.12120532989501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,16,power_law_1.2,0.11352959871292115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,16,power_law_1.2,0.21257600784301758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,16,power_law_1.2,0.30610558986663816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,8,balanced,0.12450133760770161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,16,power_law_1.2,0.39375360012054444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,8,balanced,0.14593066771825156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,8,balanced,0.046154667933781944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,16,power_law_1.2,0.1313088059425354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,16,power_law_1.2,0.5034751892089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,8,balanced,0.1449066698551178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,8,balanced,0.04717866579691569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,16,power_law_1.2,0.6730815887451171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,8,balanced,0.0492799977461497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,16,power_law_1.2,0.15159679651260377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,16,power_law_1.2,1.0783424377441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,8,balanced,0.1950506567955017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,8,balanced,0.06044800082842509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,16,power_law_1.2,0.17651840448379516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,16,power_law_1.2,1.3701888084411622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,8,balanced,0.07336000104745229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,8,balanced,0.176639993985494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,8,balanced,0.08037866652011871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,16,power_law_1.2,1.7585151672363282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,8,balanced,0.08342933654785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,16,power_law_1.2,0.24001920223236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,16,power_law_1.2,2.8671295166015627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,8,balanced,0.2670560081799825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,8,balanced,0.08343467116355896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,16,power_law_1.2,0.30053119659423827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,8,balanced,0.08437333504358928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,16,power_law_1.2,5.6875263214111325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,8,balanced,0.08424533406893413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,16,power_law_1.2,0.41146240234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,8,balanced,0.259552001953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,8,balanced,0.08662399649620056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,16,power_law_1.2,0.5491712093353271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,8,balanced,0.08673600355784099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,16,power_law_1.2,0.795468807220459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,8,balanced,0.08917333682378133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,8,balanced,0.40399467945098877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,16,power_law_1.2,1.1141759872436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,8,balanced,0.0913866659005483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,16,power_law_1.2,1.7921791076660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,8,balanced,0.09693866968154907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,8,balanced,0.10014399886131287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,16,power_law_1.2,2.3468032836914063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,8,balanced,0.4538240035374959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,8,balanced,0.10433066884676616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,16,power_law_1.2,3.9402496337890627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,8,balanced,0.12728533148765564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,16,power_law_1.2,5.2476543426513675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,8,balanced,0.13004266222318014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,16,power_law_1.2,11.071097564697265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,8,balanced,0.17660266160964966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,8,balanced,0.6482933362325033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,8,power_law_1.01,0.07073280215263367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,8,balanced,0.17269333203633627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,8,power_law_1.01,0.07452160120010376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,8,power_law_1.01,0.05952640175819397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,8,balanced,0.24401066700617471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,8,power_law_1.01,0.07412480115890503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,8,power_law_1.01,0.07584000229835511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,8,balanced,0.2717439929644267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,8,balanced,0.04292266567548116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,8,power_law_1.01,0.09130880236625671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,8,power_law_1.01,0.05601919889450073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,8,balanced,0.8546133041381836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,8,balanced,0.04517866671085358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,8,power_law_1.01,0.09678080081939697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,8,power_law_1.01,0.06119679808616638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,8,balanced,0.04789333542188009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,8,balanced,0.4123786687850952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,8,power_law_1.01,0.09756159782409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,8,balanced,0.0584799995024999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,8,power_law_1.01,0.05170559883117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,8,balanced,0.06969599922498067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,8,power_law_1.01,0.10257279872894287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,8,power_law_1.01,0.058310401439666745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,8,balanced,0.07823466757933299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,8,power_law_1.01,0.06714879870414733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,8,power_law_1.01,0.1066815972328186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,8,balanced,0.07984533409277599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,8,balanced,0.08102400104204814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,8,power_law_1.01,0.07349119782447815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,8,power_law_1.01,0.10992640256881714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,8,balanced,0.4869226614634196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,8,balanced,0.0812853326400121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,8,power_law_1.01,0.07760000228881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,8,balanced,0.08309866487979889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,8,power_law_1.01,0.11845120191574096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,8,balanced,0.08539199829101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,8,power_law_1.01,0.07906559705734253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,8,power_law_1.01,0.12282240390777588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,8,balanced,0.0865226686000824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,8,power_law_1.01,0.07861760258674622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,8,power_law_1.01,0.11299200057983398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,8,balanced,0.08920533458391826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,8,balanced,0.9533493518829346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,8,power_law_1.01,0.08260480165481568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,8,balanced,0.0925600032011668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,8,power_law_1.01,0.12095359563827515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,8,balanced,0.09819733103116353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,8,power_law_1.01,0.08626559972763062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,8,power_law_1.01,0.13687039613723756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,8,balanced,0.6970453262329102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,8,power_law_1.01,0.09157119989395142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,8,power_law_1.01,0.14646400213241578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,8,power_law_1.01,0.09626880288124084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,8,power_law_1.01,0.17637759447097778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,8,power_law_1.01,0.09267839789390564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,8,balanced,0.10420266787211101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,8,power_law_1.01,0.177401602268219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,8,power_law_1.01,0.10506240129470826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,8,power_law_1.01,0.11411839723587036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,8,power_law_1.01,0.22955520153045655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,8,power_law_1.01,0.12169599533081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,8,power_law_1.01,0.25788800716400145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,8,power_law_1.01,0.1404096007347107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,8,balanced,0.11341333389282227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,8,power_law_1.01,0.30674560070037843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,8,balanced,0.8977706432342529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,8,power_law_1.01,0.150873601436615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,8,power_law_1.01,0.40008959770202634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,8,power_law_1.01,0.20353920459747316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,8,power_law_1.01,0.5160064220428466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,8,power_law_1.01,0.22154879570007324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,8,power_law_1.01,0.6063168048858643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,8,power_law_1.01,0.27778561115264894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,8,power_law_1.01,0.8906815528869629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,8,balanced,0.13316266735394797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,8,power_law_1.01,0.40178561210632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,8,balanced,1.4679786364237468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,8,power_law_1.01,0.4874752044677734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,8,power_law_1.01,1.219814395904541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,8,balanced,0.14591466387112936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,8,power_law_1.01,0.6103551864624024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,8,power_law_1.01,1.4406656265258788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,8,power_law_1.01,0.9060416221618652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,8,power_law_1.01,2.2414783477783202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,8,balanced,1.0608747005462646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,8,power_law_1.01,1.1553855895996095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,8,power_law_1.01,4.563455963134766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,8,power_law_1.01,1.504748821258545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,8,balanced,0.17969600359598795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,8,power_law_1.01,2.4024320602416993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,8,balanced,0.21947733561197916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,8,power_law_1.01,0.058457601070404056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,8,power_law_1.01,4.75939826965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,8,balanced,0.3304693301518758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,8,power_law_1.01,0.05966079831123352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,8,power_law_1.01,0.05041279792785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,8,balanced,0.399402658144633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,8,power_law_1.01,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,8,power_law_1.01,0.06506879925727845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,8,balanced,0.5688586632410685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,8,power_law_1.01,0.07482879757881164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,8,power_law_1.01,0.07834240198135375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,8,power_law_1.01,0.07948799729347229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,8,balanced,1.655194600423177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,8,power_law_1.01,0.08161919713020324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,8,balanced,0.7411519686381022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,8,power_law_1.01,0.08487679958343505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,8,power_law_1.01,0.0889855980873108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,8,power_law_1.01,0.09496960043907166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,8,power_law_1.01,0.10566400289535523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,8,power_law_1.01,0.10973440408706665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,8,balanced,1.0335413614908855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,8,power_law_1.01,0.1191167950630188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,8,balanced,2.7824319203694663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,8,power_law_1.01,0.12896640300750734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,8,power_law_1.2,0.06936960220336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,8,power_law_1.2,0.06310399770736694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,8,power_law_1.01,0.13701119422912597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,8,balanced,1.3776373863220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,8,power_law_1.2,0.05785599946975708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,8,power_law_1.2,0.06649600267410279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,8,power_law_1.01,0.16324479579925538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,8,power_law_1.2,0.07352960109710693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,8,power_law_1.01,0.1817023992538452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,8,power_law_1.2,0.0920639991760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,8,power_law_1.2,0.09639040231704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,8,power_law_1.2,0.09909759759902954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,8,power_law_1.01,0.2544703960418701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,8,power_law_1.2,0.10611840486526489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,8,balanced,1.6836907068888347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,8,power_law_1.01,0.2923392057418823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,8,power_law_1.2,0.10832639932632446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,8,power_law_1.2,0.11530239582061767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,8,power_law_1.01,0.4383232116699219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,8,power_law_1.2,0.1239359974861145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,8,power_law_1.01,0.5893760204315186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,8,balanced,3.217349370320638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,8,power_law_1.2,0.12501120567321777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,8,power_law_1.01,0.7989120006561279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,8,power_law_1.2,0.11627520322799682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,8,power_law_1.2,0.05627520084381103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,8,power_law_1.01,1.0236800193786622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,8,power_law_1.2,0.13345919847488402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,8,power_law_1.2,0.05195519924163818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,8,power_law_1.01,1.4420991897583009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,8,power_law_1.2,0.1344831943511963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,8,power_law_1.2,0.05047680139541626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,8,power_law_1.01,2.0926015853881834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,8,power_law_1.2,0.14741120338439942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,8,power_law_1.2,0.056454402208328244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,8,power_law_1.2,0.17473920583724975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,8,power_law_1.01,2.42803840637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,8,power_law_1.2,0.06453120112419128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,8,power_law_1.2,0.19568639993667603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,8,power_law_1.2,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,8,power_law_1.01,4.163174438476562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,8,power_law_1.2,0.24543359279632568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,8,balanced,2.647162596384684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,8,power_law_1.2,0.07651200294494628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,8,power_law_1.2,0.2628607988357544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,8,power_law_1.01,7.7628929138183596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,8,power_law_1.2,0.07875840067863464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,8,power_law_1.2,0.3455679893493652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,8,power_law_1.2,0.08125439882278443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,8,power_law_1.2,0.43736958503723145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,8,power_law_1.2,0.08162559866905213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,8,power_law_1.2,0.6200895786285401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,8,power_law_1.2,0.0873856008052826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,8,power_law_1.2,0.7553919792175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,8,power_law_1.2,0.09173120260238647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,8,power_law_1.2,1.0470975875854491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,8,power_law_1.2,0.09712640047073365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,8,power_law_1.2,1.2884223937988282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,8,power_law_1.2,0.09825279712677001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,8,power_law_1.2,0.10618239641189575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,8,power_law_1.2,1.8643455505371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,8,power_law_1.2,0.1120576024055481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,8,power_law_1.2,3.0174335479736327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,8,power_law_1.2,0.12188160419464111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,8,power_law_1.2,0.15020159482955933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,8,power_law_1.2,6.440057373046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,8,power_law_1.2,0.15569280385971068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,8,power_law_1.2,0.21171200275421143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,8,power_law_1.2,0.23613440990447998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,8,power_law_1.2,0.291974401473999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,8,power_law_1.2,0.4044288158416748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,8,power_law_1.2,0.5844287872314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,8,power_law_1.2,0.7474559783935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,8,power_law_1.2,1.1182144165039063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,8,balanced,5.245861371358235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,8,power_law_1.2,1.3807104110717774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,8,power_law_1.2,1.9834304809570313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,8,power_law_1.2,2.849830436706543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,8,power_law_1.2,6.439180755615235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,8,power_law_1.2,0.05751680135726929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,8,power_law_1.2,0.05139200091361999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,8,power_law_1.2,0.0506816029548645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,8,power_law_1.2,0.05867519974708557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,4,balanced,0.0524586687485377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,8,power_law_1.2,0.06460800170898437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,4,balanced,0.056186666091283165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,8,power_law_1.2,0.07154560089111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,4,balanced,0.06012799839178721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,4,balanced,0.0792746643225352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,8,power_law_1.2,0.07651839852333069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,4,balanced,0.10172266761461894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,8,power_law_1.2,0.07902719974517822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,4,balanced,0.12846400340398154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,8,power_law_1.2,0.08651520013809204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,4,balanced,0.12850667039553323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,8,power_law_1.2,0.0856768012046814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,4,balanced,0.1143999993801117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,8,power_law_1.2,0.09210879802703857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,4,balanced,0.11685333649317424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,8,power_law_1.2,0.10453120470046998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,4,balanced,0.11779200037320454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,8,power_law_1.2,0.10053759813308716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,4,balanced,0.11876799662907918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,8,power_law_1.2,0.11322879791259766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,4,balanced,0.12079999844233195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,8,power_law_1.2,0.12511359453201293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,4,balanced,0.12105600039164226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,4,balanced,0.12657599647839865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,8,power_law_1.2,0.12762240171432496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,4,balanced,0.04665066798528036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,4,balanced,0.13251733779907227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,4,balanced,0.0505920002857844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,4,balanced,0.13515200217564902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,4,balanced,0.05237866441408793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,8,power_law_1.2,0.1493631958961487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,4,balanced,0.14063466588656107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,4,balanced,0.06687999765078227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,4,balanced,0.17749865849812826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,4,balanced,0.08134399851163228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,8,power_law_1.2,0.17256319522857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,4,balanced,0.09640533725420634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,4,balanced,0.1761173407236735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,4,balanced,0.09867200255393982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,8,power_law_1.2,0.18580479621887208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,4,balanced,0.09502399961153667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,4,balanced,0.24157865842183432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,4,balanced,0.09532800316810608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,8,power_law_1.2,0.2753151893615723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,4,balanced,0.09699199597040813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,4,balanced,0.09648000200589497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,4,balanced,0.2314186692237854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,8,power_law_1.2,0.37292799949645994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,4,balanced,0.09900800387064616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,8,power_law_1.2,0.5199168205261231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,4,balanced,0.10073600212732951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,8,power_law_1.2,0.6151872158050538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,4,balanced,0.3516053358713786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,4,balanced,0.10429333647092183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,8,power_law_1.2,1.0671680450439454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,4,balanced,0.11052800218264262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,8,power_law_1.2,1.2949952125549316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,4,balanced,0.11412800351778667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,4,balanced,0.34095466136932373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,8,power_law_1.2,1.9340351104736329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,4,balanced,0.12267200152079265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,8,power_law_1.2,2.2959615707397463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,4,balanced,0.15755732854207358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,4,balanced,0.5549120108286539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,4,balanced,0.05031999945640564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,8,power_law_1.2,3.253670501708984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,4,balanced,0.1572480003039042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,4,balanced,0.053226664662361145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,4,balanced,0.188917338848114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,8,power_law_1.2,5.271270370483398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,4,balanced,0.05518400172392527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,4,balanced,0.07006399830182393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,4,balanced,0.21388800938924155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,4,balanced,0.08582400282224019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,8,power_law_1.2,13.21294708251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,4,balanced,0.6142613490422567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,4,balanced,0.09461333354314168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,4,balanced,0.09769066174825032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,4,balanced,0.09821333487828572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,4,balanced,0.3064533273379008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,4,balanced,0.10062399506568909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,4,power_law_1.01,0.05910400152206421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,4,balanced,0.10237866640090942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,4,balanced,0.357589324315389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,4,power_law_1.01,0.0656063973903656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,4,balanced,0.9190613428751627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,4,balanced,0.1063253382841746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,4,power_law_1.01,0.059494400024414064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,4,balanced,0.10795199871063232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,4,power_law_1.01,0.07000960111618042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,4,balanced,0.11168000102043152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,4,balanced,0.5286773443222046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,4,power_law_1.01,0.08294399976730346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,4,balanced,0.11808533469835918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,4,power_law_1.01,0.09882879853248597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,4,balanced,0.1256480018297831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,4,power_law_1.01,0.10474239587783814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,4,power_law_1.01,0.05076479911804199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,4,power_law_1.01,0.10952320098876953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,4,balanced,0.664352019627889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,4,power_law_1.01,0.10586240291595458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,4,power_law_1.01,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,4,balanced,1.1692480246225994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,4,power_law_1.01,0.11260160207748413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,4,power_law_1.01,0.053907197713851926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,4,balanced,0.13667200009028116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,4,power_law_1.01,0.11904000043869019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,4,power_law_1.01,0.06340479850769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,4,power_law_1.01,0.12232320308685303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,4,power_law_1.01,0.06661120057106018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,4,power_law_1.01,0.12616319656372071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,4,power_law_1.01,0.08291839957237243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,4,power_law_1.01,0.13893120288848876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,4,balanced,0.962826649347941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,4,power_law_1.01,0.08985599875450134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,4,power_law_1.01,0.14325759410858155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,4,balanced,0.14829333623250326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,4,power_law_1.01,0.08887680172920227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,4,power_law_1.01,0.15292160511016845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,4,power_law_1.01,0.08833919763565064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,4,power_law_1.01,0.16844160556793214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,4,power_law_1.01,0.19901440143585206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,4,power_law_1.01,0.09200639724731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,4,balanced,1.3344747225443523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,4,power_law_1.01,0.09585919976234436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,4,power_law_1.01,0.2202687978744507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,4,balanced,0.18571199973424277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,4,power_law_1.01,0.10122879743576049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,4,power_law_1.01,0.26537599563598635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,4,balanced,0.21733866135279337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,4,balanced,1.2162826855977376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,4,power_law_1.01,0.10465279817581177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,4,power_law_1.01,0.32106881141662597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,4,power_law_1.01,0.10955519676208496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,4,power_law_1.01,0.4176767826080322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,4,balanced,0.2999733289082845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,4,power_law_1.01,0.12451200485229492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,4,power_law_1.01,0.49838080406188967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,4,power_law_1.01,0.12887680530548096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,4,balanced,0.35889601707458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,4,power_law_1.01,0.6790656089782715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,4,power_law_1.01,0.058246397972106935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,4,power_law_1.01,0.14228479862213134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,4,power_law_1.01,0.7986303806304932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,4,power_law_1.01,0.17099519968032836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,4,power_law_1.01,0.06020479798316956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,4,balanced,0.5219146807988485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,4,power_law_1.01,1.1684096336364747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,4,power_law_1.01,0.17812479734420777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,4,power_law_1.01,0.057062399387359616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,4,power_law_1.01,0.21713919639587403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,4,power_law_1.01,1.4775487899780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,4,power_law_1.01,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,4,power_law_1.2,0.05888640284538269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,4,balanced,0.6455519994099935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,4,power_law_1.01,0.26152958869934084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,4,power_law_1.01,0.07554559707641602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,4,balanced,1.4466346104939778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,4,power_law_1.01,1.8514432907104492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,4,power_law_1.2,0.05797759890556335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,4,power_law_1.01,0.0889087975025177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,4,power_law_1.01,0.340774393081665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,4,balanced,2.117664019266764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,4,power_law_1.01,2.724287986755371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,4,power_law_1.2,0.06048640012741089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,4,power_law_1.01,0.43936638832092284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,4,power_law_1.01,0.09381759762763978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,4,balanced,0.9217920303344727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,4,power_law_1.2,0.07103999853134155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,4,power_law_1.01,0.5843584060668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,4,power_law_1.01,0.09532160162925721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,4,power_law_1.01,5.3893695831298825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,4,power_law_1.2,0.08009600043296813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,4,power_law_1.01,0.09917439818382263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,4,power_law_1.01,0.7408063888549805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,4,power_law_1.2,0.10584959983825684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,4,power_law_1.01,0.10369280576705933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,4,power_law_1.01,1.082323169708252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,4,power_law_1.2,0.11347839832305909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,4,balanced,1.202672004699707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,4,power_law_1.01,0.11192959547042847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,4,power_law_1.01,1.398323154449463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,4,power_law_1.2,0.11037440299987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,4,power_law_1.01,0.1214400053024292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,4,power_law_1.01,1.7434816360473633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,4,power_law_1.2,0.10960639715194702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,4,power_law_1.01,0.12603520154953002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,4,power_law_1.01,2.8247039794921873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,4,power_law_1.2,0.11012480258941651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,4,power_law_1.01,0.13808000087738037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,4,power_law_1.2,0.12002559900283813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,4,power_law_1.01,0.15407999753952026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,4,power_law_1.01,5.960710525512695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,4,balanced,1.7193493843078613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,4,power_law_1.2,0.12108160257339477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,4,balanced,2.298133373260498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,4,power_law_1.2,0.12525440454483033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,4,power_law_1.01,0.16254080533981324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,4,power_law_1.2,0.14246400594711303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,4,power_law_1.2,0.1476096034049988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,4,power_law_1.01,0.17605760097503662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,4,power_law_1.2,0.15754239559173583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,4,power_law_1.2,0.17568000555038452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,4,balanced,2.280853271484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,4,power_law_1.2,0.19423999786376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,4,power_law_1.01,0.21329920291900634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,4,power_law_1.01,0.25742080211639407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,4,power_law_1.2,0.22249600887298585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,4,power_law_1.01,0.35431680679321287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,4,power_law_1.2,0.2678719997406006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,4,power_law_1.2,0.31420159339904785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,4,power_law_1.01,0.433241605758667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,4,power_law_1.01,0.6712255954742432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,4,power_law_1.2,0.4174079895019531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,4,power_law_1.2,0.5239871978759766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,4,power_law_1.01,0.750547218322754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,4,power_law_1.2,0.7034111976623535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,4,power_law_1.01,1.0855232238769532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,4,balanced,4.06876277923584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,4,power_law_1.2,0.8517760276794434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,4,balanced,2.7962026596069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,4,power_law_1.01,1.5020671844482423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,4,power_law_1.2,1.3430527687072753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,4,power_law_1.01,2.036038398742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,4,power_law_1.2,1.7178047180175782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,4,power_law_1.01,3.140390396118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,4,power_law_1.2,2.0596736907958983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,4,power_law_1.01,3.5801406860351563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,4,power_law_1.2,2.8844032287597656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,4,power_law_1.01,5.629996871948242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,4,power_law_1.2,6.637229156494141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,4,power_law_1.01,12.61932830810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,4,balanced,4.490922609965007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,4,balanced,4.433077176411946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,4,power_law_1.2,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,4,power_law_1.2,0.05236480236053467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,4,power_law_1.2,0.05248000025749207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,4,power_law_1.2,0.06323199868202209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,4,power_law_1.2,0.06782720088958741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,4,power_law_1.2,0.0827455997467041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,4,power_law_1.2,0.09039999842643738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,4,power_law_1.2,0.08885759711265565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,4,power_law_1.2,0.0923200011253357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,4,power_law_1.2,0.09251199960708618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,4,power_law_1.2,0.09928960204124451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,4,power_law_1.2,0.10232959985733033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,4,power_law_1.2,0.10621440410614014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,4,power_law_1.2,0.11818879842758179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,4,power_law_1.2,0.1269376039505005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,4,power_law_1.2,0.13048959970474244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,4,power_law_1.2,0.14423680305480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,4,power_law_1.2,0.17069439888000487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,4,power_law_1.2,0.1851904034614563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,4,power_law_1.2,0.22715520858764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,4,power_law_1.2,0.275711989402771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,4,power_law_1.2,0.3692863941192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,4,balanced,8.803904215494791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,4,power_law_1.2,0.4691648006439209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,4,power_law_1.2,0.6046656131744385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,4,power_law_1.2,0.8418432235717773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,4,power_law_1.2,1.2688511848449706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,4,power_law_1.2,1.5290816307067872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,4,power_law_1.2,1.822368049621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,4,power_law_1.2,3.3497344970703127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,4,power_law_1.2,7.572345733642578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,4,power_law_1.2,0.057004797458648684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,4,power_law_1.2,0.05626239776611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,4,power_law_1.2,0.05787519812583923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,4,power_law_1.2,0.06595199704170226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,4,power_law_1.2,0.07175679802894593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,2,balanced,0.053616002202034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,4,power_law_1.2,0.08665599822998046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,2,balanced,0.05677333474159241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,4,power_law_1.2,0.09288319945335388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,2,balanced,0.06554133196671803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,4,power_law_1.2,0.09618560075759888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,2,balanced,0.087909330924352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,2,balanced,0.11318932970364888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,4,power_law_1.2,0.10104320049285889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,2,balanced,0.14147200187047324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,4,power_law_1.2,0.106278395652771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,2,balanced,0.14244799812634787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,4,power_law_1.2,0.11755520105361938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,2,balanced,0.14029332995414734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,4,power_law_1.2,0.12168960571289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,2,balanced,0.14013333121935526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,4,power_law_1.2,0.13064320087432862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,4,power_law_1.2,0.1432255983352661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,2,balanced,0.14196800192197165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,4,power_law_1.2,0.16427520513534546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,2,balanced,0.1435466706752777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,2,balanced,0.14729066689809164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,4,power_law_1.2,0.16059520244598388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,2,balanced,0.14846932888031006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,2,balanced,0.15528000394503275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,4,power_law_1.2,0.17745920419692993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,2,balanced,0.16343999902407327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,2,balanced,0.1688693364461263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,2,balanced,0.16964266697565714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,4,power_law_1.2,0.2275455951690674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,4,power_law_1.2,0.2797951936721802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,2,balanced,0.2490346630414327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,4,power_law_1.2,0.36277759075164795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,2,balanced,0.04808533191680908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,2,balanced,0.23399466276168823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,4,power_law_1.2,0.47679362297058103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,2,balanced,0.05146666864554087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,4,power_law_1.2,0.6612927913665771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,2,balanced,0.30052266518274945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,2,balanced,0.05667733152707418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,4,power_law_1.2,0.8553024291992187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,2,balanced,0.0728000005086263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,2,balanced,0.3033013343811035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,2,balanced,0.09703466296195984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,4,power_law_1.2,1.2596096038818358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,2,balanced,0.11573333541552226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,4,power_law_1.2,1.575443172454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,2,balanced,0.11668800314267476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,2,balanced,0.4935946861902873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,2,balanced,0.11633599797884624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,4,power_law_1.2,2.2806207656860353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,2,balanced,0.11918399731318156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,2,balanced,0.12099200487136841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,4,power_law_1.2,3.3022079467773438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,2,balanced,0.5457493464152018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,2,balanced,0.12316800157229106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,4,power_law_1.2,4.857791900634766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,2,balanced,0.12487467130025227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,2,balanced,0.12838932871818542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,4,power_law_1.2,6.557644653320312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,2,power_law_1.01,0.051737600564956666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,2,balanced,0.13356799880663553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,2,balanced,0.8245013554890951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,2,power_law_1.01,0.06288639903068542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,2,balanced,0.14081066846847534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,2,power_law_1.01,0.05240319967269898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,4,power_law_1.2,14.19665985107422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,2,power_law_1.01,0.05551360249519348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,2,balanced,0.16088533401489258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,2,power_law_1.01,0.060127997398376466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,2,power_law_1.01,0.06558079719543457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,2,balanced,0.16168000300725302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,2,power_law_1.01,0.061926400661468504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,2,power_law_1.01,0.07454079985618592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,2,balanced,0.24236265818277994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,2,balanced,1.0138400395711262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,2,power_law_1.01,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,2,power_law_1.01,0.09479680061340331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,2,power_law_1.01,0.10170880556106568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,2,power_law_1.01,0.08828160166740417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,2,balanced,0.21033066511154175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,2,power_law_1.01,0.1013375997543335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,2,power_law_1.01,0.11240960359573364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,2,power_law_1.01,0.10595200061798096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,2,balanced,0.26820266246795654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,2,power_law_1.01,0.11475839614868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,2,power_law_1.01,0.11399040222167969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,2,power_law_1.01,0.1324288010597229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,2,power_law_1.01,0.12177280187606812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,2,balanced,0.29241599639256793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,2,power_law_1.01,0.12865279912948607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,2,power_law_1.01,0.13320959806442262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,2,balanced,1.5507253011067708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,2,power_law_1.01,0.13760000467300415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,2,power_law_1.01,0.13482240438461304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,2,balanced,0.4500053326288859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,2,power_law_1.01,0.1408959984779358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,2,power_law_1.01,0.14186240434646608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,2,power_law_1.01,0.15507839918136596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,2,power_law_1.01,0.1507200002670288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,2,power_law_1.01,0.17575680017471312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,2,balanced,0.5387733379999796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,2,power_law_1.01,0.18245760202407837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,2,power_law_1.01,0.1561087965965271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,2,power_law_1.01,0.2346560001373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,2,power_law_1.01,0.1559872031211853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,2,power_law_1.01,0.23463039398193358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,2,power_law_1.01,0.1685696005821228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,2,power_law_1.01,0.289247989654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,2,power_law_1.01,0.1777791976928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,2,balanced,0.8151733080546061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,2,balanced,1.8002400398254395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,2,power_law_1.01,0.35395839214324953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,2,power_law_1.01,0.1889407992362976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,2,power_law_1.01,0.48664321899414065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,2,power_law_1.01,0.2523967981338501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,2,power_law_1.01,0.5989632129669189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,2,power_law_1.01,0.2519615888595581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,2,power_law_1.01,0.8305472373962403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,2,power_law_1.01,0.32355198860168455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,2,power_law_1.01,1.0863807678222657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,2,balanced,1.036629358927409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,2,power_law_1.01,0.39265921115875246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,2,power_law_1.01,1.549567985534668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,2,power_law_1.01,1.952467155456543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,2,power_law_1.01,0.5007359981536865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,2,power_law_1.01,0.6098495960235596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,2,power_law_1.01,2.3882944107055666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,2,power_law_1.01,0.8657600402832031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,2,power_law_1.01,3.959532928466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,2,power_law_1.01,1.1788543701171874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,2,balanced,2.141050656636556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,2,balanced,1.5614399909973145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,2,power_law_1.01,1.6736640930175781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,2,power_law_1.01,8.025337219238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,2,power_law_1.01,2.04968318939209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,2,power_law_1.01,2.3410175323486326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,2,power_law_1.01,3.796819305419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,2,power_law_1.01,7.9224700927734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,2,balanced,1.8677280743916829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,2,power_law_1.2,0.06279039978981019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,2,balanced,3.4248905181884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,2,power_law_1.2,0.05509759783744812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,2,power_law_1.2,0.060070401430130003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,2,power_law_1.2,0.07414399981498718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,2,power_law_1.2,0.08362240195274354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,2,balanced,2.262181282043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,2,power_law_1.2,0.1091264009475708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,2,power_law_1.2,0.11271040439605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,2,power_law_1.2,0.13216639757156373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,2,power_law_1.2,0.13556480407714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,2,power_law_1.2,0.1392832040786743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,2,power_law_1.2,0.1465664029121399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,2,power_law_1.2,0.1523327946662903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,2,power_law_1.2,0.16020480394363404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,2,power_law_1.2,0.15987839698791503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,2,power_law_1.2,0.17522560358047484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,2,power_law_1.2,0.17982079982757568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,2,power_law_1.2,0.19979519844055177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,2,power_law_1.2,0.2586368083953857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,2,power_law_1.2,0.26127359867095945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,2,power_law_1.2,0.3414783954620361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,2,power_law_1.2,0.4075967788696289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,2,power_law_1.2,0.5355072021484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,2,balanced,3.599946657816569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,2,power_law_1.2,0.631667184829712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,2,power_law_1.2,0.8776448249816895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,2,power_law_1.2,1.1748479843139648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,2,power_law_1.2,1.7279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,2,power_law_1.2,2.196563148498535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,2,power_law_1.2,2.561849594116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,2,power_law_1.2,4.357811355590821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,2,balanced,6.685509363810222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,2,power_law_1.2,8.718707275390624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,2,power_law_1.2,0.0495743989944458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,2,power_law_1.2,0.05061119794845581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,2,power_law_1.2,0.05496960282325745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,2,power_law_1.2,0.06570240259170532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,2,power_law_1.2,0.0717631995677948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,2,power_law_1.2,0.0953279972076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,2,power_law_1.2,0.10067199468612671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,2,balanced,7.085215886433919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,2,power_law_1.2,0.10835200548171997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,2,power_law_1.2,0.11496319770812988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,2,power_law_1.2,0.11698559522628785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,2,power_law_1.2,0.1248960018157959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,2,power_law_1.2,0.1339840054512024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,2,power_law_1.2,0.13559039831161498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,2,power_law_1.2,0.14776959419250488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,2,power_law_1.2,0.1581055998802185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,2,power_law_1.2,0.1790336012840271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,2,power_law_1.2,0.19678720235824584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,2,power_law_1.2,0.2332672119140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,2,power_law_1.2,0.23502719402313232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,2,power_law_1.2,0.30529921054840087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,2,power_law_1.2,0.36136960983276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,2,power_law_1.2,0.47718400955200196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,2,power_law_1.2,0.6124608039855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,2,power_law_1.2,0.8763392448425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,2,power_law_1.2,1.1411520004272462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,2,power_law_1.2,1.6352703094482421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,2,power_law_1.2,2.0500288009643555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,64,balanced,0.1843199928601583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,64,balanced,0.11640000343322754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,2,power_law_1.2,2.5139455795288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,64,balanced,0.18710933128992716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,64,balanced,0.11900800466537476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,2,power_law_1.2,4.614559936523437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,64,balanced,0.18175999323527017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,64,balanced,0.12178132931391399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,64,balanced,0.19131199518839517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,64,balanced,0.12203733126322429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,2,power_law_1.2,9.255987548828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,64,balanced,0.34672534465789795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,64,balanced,0.20327999194463095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,64,balanced,0.6474773486455282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,64,balanced,0.3683893283208211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,64,balanced,0.9821440378824869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,64,balanced,0.5203200181325277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,64,balanced,1.0000639756520588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,64,balanced,0.5306133429209391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,64,balanced,1.0303253332773845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,64,balanced,0.5682080189387003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,64,balanced,0.9168480237325033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,64,balanced,0.523418664932251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,64,balanced,0.9847040176391602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,64,balanced,0.545743981997172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,64,balanced,0.9795520305633545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,64,balanced,0.5195839802424113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,64,balanced,1.0265226364135742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,64,balanced,0.5196746587753296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,64,balanced,0.9919520219167074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,64,balanced,0.5037546555201212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,64,balanced,0.9306293328603109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,64,balanced,0.5155733426411947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,64,balanced,0.9577439626057943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,64,balanced,0.5630133152008057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,64,balanced,0.05041599770387014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,64,balanced,0.9369760354359945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,64,balanced,0.5460906823476156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,64,balanced,0.05037866532802582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,64,balanced,0.9217173258463541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,64,balanced,0.5095359881718954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,64,balanced,0.05138133466243744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,64,balanced,0.9609333674112955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,64,balanced,0.05606933434804281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,64,balanced,0.5440800189971924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,64,balanced,0.0666186660528183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,64,balanced,0.9552799860636393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,64,balanced,0.08662399649620056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,64,balanced,0.5423680146535238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,64,balanced,0.11060800155003865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,64,balanced,0.9230026404062907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,64,balanced,0.11129599809646606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,64,balanced,0.5569813251495361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,64,balanced,0.11096533139546712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,64,balanced,0.11152533690134685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,64,balanced,0.8820160230000814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,64,balanced,0.5341386795043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,64,balanced,0.11337600151697795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,64,balanced,0.11506133278210957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,64,balanced,0.11594667037328084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,64,balanced,0.793503999710083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,64,balanced,0.5411573251088461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,64,balanced,0.11689066886901855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,64,balanced,0.12363732854525249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,64,balanced,0.12471999724706014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,64,balanced,0.5641066630681356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,64,balanced,0.12849066654841104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,64,balanced,0.4944266478220622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,64,balanced,0.14040533701578775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,64,power_law_1.01,0.5472256183624268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,64,power_law_1.01,0.9819583892822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,64,balanced,1.4977386792500813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,64,power_law_1.01,0.5391744136810303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,64,balanced,1.0482239723205566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,64,power_law_1.01,0.964083194732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,64,power_law_1.01,0.5171648025512695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,64,balanced,0.15100799997647604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,64,power_law_1.01,0.9870207786560059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,64,power_law_1.01,0.49553918838500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,64,power_law_1.01,0.2543423891067505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,64,power_law_1.01,0.6869120121002197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,64,power_law_1.01,0.33425920009613036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,64,power_law_1.01,0.7505792140960693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,64,power_law_1.01,0.3938688039779663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,64,power_law_1.01,0.6458240032196045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,64,power_law_1.01,0.46900482177734376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,64,balanced,1.0524213314056396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,64,power_law_1.01,0.6952447891235352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,64,balanced,0.9200479984283447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,64,power_law_1.01,0.4530623912811279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,64,power_law_1.01,0.9173760414123535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,64,power_law_1.01,0.9564800262451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,64,power_law_1.01,0.5407296180725097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,64,balanced,0.17203734318415323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,64,power_law_1.01,0.9450431823730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,64,power_law_1.01,0.5011072158813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,64,power_law_1.01,0.8340288162231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,64,power_law_1.01,0.45411200523376466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,64,balanced,0.18995734055836996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,64,power_law_1.01,0.8248255729675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,64,power_law_1.01,0.4725503921508789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,64,power_law_1.01,0.862611198425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,64,power_law_1.01,0.5256319999694824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,64,power_law_1.01,0.9376319885253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,64,balanced,0.22296533981959024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,64,balanced,1.925322691599528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,64,power_law_1.01,0.4389887809753418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,64,power_law_1.01,0.8343423843383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,64,balanced,1.451514720916748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,64,power_law_1.01,0.8536576271057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,64,power_law_1.01,0.4931136131286621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,64,power_law_1.01,0.8572223663330079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,64,power_law_1.01,0.47135357856750487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,64,power_law_1.01,0.789081621170044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,64,power_law_1.01,0.11425919532775879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,64,power_law_1.01,0.45871357917785643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,64,power_law_1.01,1.00448637008667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,64,power_law_1.01,0.4862527847290039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,64,power_law_1.01,1.2477696418762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,64,power_law_1.01,0.10398080348968505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,64,power_law_1.01,0.4868351936340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,64,power_law_1.01,1.3269056320190429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,64,power_law_1.01,0.10209280252456665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,64,power_law_1.01,1.6025535583496093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,64,power_law_1.01,0.573203182220459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,64,balanced,0.26656534274419147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,64,power_law_1.01,0.06686080098152161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,64,power_law_1.01,2.19749755859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,64,power_law_1.01,0.6569600105285645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,64,power_law_1.01,0.07991679906845092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,64,power_law_1.01,2.6488447189331055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,64,power_law_1.01,0.8126591682434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,64,balanced,2.7098239262898765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,64,balanced,1.9599520365397136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,64,power_law_1.01,0.09015039801597595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,64,power_law_1.01,4.130771255493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,64,power_law_1.01,0.9591487884521485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,64,balanced,0.33375998338063556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,64,power_law_1.01,0.09875199794769288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,64,power_law_1.01,1.1673407554626465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,64,power_law_1.01,5.576588821411133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,64,power_law_1.01,0.10246399641036988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,64,power_law_1.01,1.746931266784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,64,power_law_1.01,6.632556915283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,64,power_law_1.01,0.1093824028968811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,64,power_law_1.01,2.240300750732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,64,power_law_1.01,10.250508880615234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,64,power_law_1.01,0.1050879955291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,64,balanced,0.45049067338307697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,64,power_law_1.01,3.0420480728149415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,64,power_law_1.01,0.10714880228042603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,64,power_law_1.01,3.5639873504638673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,64,power_law_1.01,0.10938880443572999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,64,power_law_1.01,21.169247436523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,64,power_law_1.01,0.12111999988555908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,64,power_law_1.01,5.993056106567383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,64,power_law_1.01,0.1254464030265808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,64,power_law_1.01,0.13388799428939818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,64,balanced,0.5928053458531698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,64,power_law_1.01,0.146560001373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,64,power_law_1.01,11.893055725097657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,64,power_law_1.01,0.1622655987739563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,64,balanced,3.88590399424235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,64,power_law_1.01,0.1909119963645935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,64,balanced,2.84059206644694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,64,power_law_1.01,0.19877760410308837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,64,power_law_1.2,0.9524095535278321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,64,power_law_1.01,0.22122879028320314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,64,power_law_1.2,0.937337589263916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,64,power_law_1.01,0.273471999168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,64,balanced,0.8111039797465006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,64,power_law_1.2,0.9650943756103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,64,power_law_1.01,0.3926271915435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,64,power_law_1.2,0.45863680839538573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,64,power_law_1.2,0.6243648052215576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,64,power_law_1.2,0.5617856025695801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,64,power_law_1.01,0.4574399948120117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,64,power_law_1.2,0.5783743858337402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,64,power_law_1.2,0.5274879932403564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,64,power_law_1.2,0.6809023857116699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,64,power_law_1.01,0.5481919765472412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,64,power_law_1.2,0.47150721549987795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,64,power_law_1.2,0.8456192016601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,64,power_law_1.01,0.783846378326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,64,power_law_1.2,0.25701758861541746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,64,power_law_1.2,0.778278398513794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,64,power_law_1.01,1.1570303916931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,64,power_law_1.2,0.3252543926239014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,64,power_law_1.2,0.8320704460144043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,64,power_law_1.2,0.35513598918914796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,64,power_law_1.01,1.5348416328430177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,64,power_law_1.2,0.8845248222351074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,64,power_law_1.2,0.333350396156311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,64,balanced,0.9991786479949951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,64,power_law_1.2,0.8823360443115235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,64,power_law_1.2,0.39373440742492677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,64,power_law_1.01,1.8908735275268556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,64,power_law_1.2,0.8902400016784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,64,power_law_1.2,0.49679999351501464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,64,power_law_1.2,0.8689984321594239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,64,power_law_1.01,2.9641855239868162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,64,power_law_1.2,0.41146240234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,64,power_law_1.2,0.8850111961364746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,64,power_law_1.2,0.44727678298950196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,64,power_law_1.01,6.069926452636719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,64,power_law_1.2,0.8669119834899902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,64,power_law_1.2,0.46129279136657714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,64,power_law_1.2,0.7249407768249512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,64,balanced,6.625312169392903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,64,power_law_1.2,0.505299186706543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,64,balanced,5.155973434448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,64,power_law_1.2,0.4961728096008301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,64,power_law_1.2,0.8692288398742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,64,power_law_1.2,0.44671359062194826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,64,power_law_1.2,0.9887743949890136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,64,power_law_1.2,0.420684814453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,64,power_law_1.2,1.1132736206054688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,64,power_law_1.2,0.46426239013671877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,64,power_law_1.2,1.287168025970459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,64,balanced,1.5399573644002278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,64,power_law_1.2,0.48919677734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,64,power_law_1.2,1.8021760940551759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,64,power_law_1.2,0.5626175880432129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,64,power_law_1.2,2.047942352294922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,64,power_law_1.2,0.6445184230804444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,64,power_law_1.2,2.8875200271606447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,64,power_law_1.2,0.7082560062408447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,64,power_law_1.2,3.2697982788085938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,64,power_law_1.2,0.9649920463562012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,64,power_law_1.2,5.400441741943359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,64,power_law_1.2,1.2080063819885254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,64,power_law_1.2,1.5446271896362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,64,power_law_1.2,6.325395202636718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,64,power_law_1.2,1.9977407455444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,64,power_law_1.2,9.160185241699219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,64,power_law_1.2,2.956224060058594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,64,power_law_1.2,17.16938171386719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,64,power_law_1.2,4.087321472167969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,64,power_law_1.2,4.84126091003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,64,power_law_1.2,36.748410034179685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,64,power_law_1.2,8.705677032470703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,64,power_law_1.2,17.690789794921876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,64,balanced,3.0367358525594077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,32,balanced,0.11031466722488403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,32,balanced,0.11109866698582967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,32,balanced,0.11692800124486287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,64,power_law_1.2,0.11066240072250366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,32,balanced,0.19969600439071655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,64,power_law_1.2,0.10484479665756226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,32,balanced,0.37005865573883057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,32,balanced,0.6806826591491699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,64,power_law_1.2,0.09434239864349366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,32,balanced,0.9920852979024252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,64,power_law_1.2,0.07337599992752075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,32,balanced,0.9641760190327963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,64,power_law_1.2,0.07992960214614868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,32,balanced,0.9845759868621826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,64,power_law_1.2,0.07948799729347229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,32,balanced,0.9826292991638184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,64,power_law_1.2,0.08513280153274536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,32,balanced,0.9893866380055746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,64,power_law_1.2,0.10200320482254029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,32,balanced,0.9737226963043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,32,balanced,0.9930079778035482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,64,power_law_1.2,0.104038405418396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,32,balanced,0.9584266344706217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,64,power_law_1.2,0.10392320156097412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,32,balanced,0.9612906773885092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,64,power_law_1.2,0.10216319561004639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,32,balanced,0.9758933385213217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,64,power_law_1.2,0.11059839725494384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,32,balanced,0.919263998667399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,64,power_law_1.2,0.12371840476989746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,32,balanced,0.9116960366566976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,64,power_law_1.2,0.1308735966682434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,32,balanced,0.9206986427307129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,64,power_law_1.2,0.14209280014038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,64,power_law_1.2,0.148364794254303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,32,balanced,0.9151626427968343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,64,power_law_1.2,0.1624127984046936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,32,balanced,0.9331786632537842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,64,power_law_1.2,0.21454079151153566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,32,balanced,0.875162680943807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,32,balanced,0.07598400115966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,64,power_law_1.2,0.2167423963546753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,32,balanced,0.07725866635640462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,32,balanced,0.790293296178182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,32,balanced,0.07980800171693166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,32,balanced,0.12948800126711527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,64,power_law_1.2,0.24836480617523193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,32,balanced,0.21944000323613486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,32,balanced,0.38155198097229004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,32,power_law_1.01,0.6601024150848389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,64,power_law_1.2,0.31002240180969237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,32,balanced,0.5235146681467692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,32,balanced,0.6101866563161215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,64,power_law_1.2,0.45793919563293456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,32,balanced,0.5333866675694784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,32,power_law_1.01,0.9488384246826171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,32,balanced,0.5699893236160278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,32,balanced,0.5256959994633993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,32,power_law_1.01,0.9699071884155274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,32,balanced,0.5518720149993896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,32,power_law_1.01,0.295411205291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,64,power_law_1.2,0.5285696029663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,32,balanced,0.5628373225529989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,32,power_law_1.01,0.46513919830322265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,32,balanced,0.5511840184529623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,32,balanced,0.04578666885693868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,32,balanced,1.583936055501302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,64,power_law_1.2,0.7385663986206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,32,balanced,0.541322668393453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,32,power_law_1.01,0.5699711799621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,32,balanced,0.04692266881465912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,32,balanced,0.5685173273086548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,64,power_law_1.2,1.0067392349243165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,32,balanced,0.04666133224964142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,32,power_law_1.01,0.6517312049865722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,32,balanced,0.5437813202540079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,32,balanced,0.05266666909058889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,64,power_law_1.2,1.3831168174743653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,32,balanced,0.573306679725647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,32,power_law_1.01,0.8269696235656738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,32,balanced,0.06809600194295247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,32,balanced,0.5494773387908936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,32,balanced,0.08775466680526733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,32,power_law_1.01,0.8333056449890137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,32,balanced,0.5515893300374349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,32,balanced,0.11081600189208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,64,power_law_1.2,2.3880128860473633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,32,balanced,1.1632906595865886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,32,power_law_1.01,0.7903359889984131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,32,balanced,0.11264000336329143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,32,balanced,0.5568373203277588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,32,balanced,0.11308800180753072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,32,power_law_1.01,0.8702079772949218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,64,power_law_1.2,2.400992012023926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,32,balanced,0.1135040024916331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,32,balanced,0.5457066694895426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,32,balanced,0.11515200138092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,32,power_law_1.01,0.7781439781188965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,64,power_law_1.2,4.805683135986328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,32,balanced,0.11606933673222859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,32,balanced,0.5625439882278442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,32,power_law_1.01,0.7669312000274658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,32,balanced,0.11755733688672383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,32,power_law_1.01,0.7940800189971924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,32,balanced,0.11979732910792033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,64,power_law_1.2,8.789862060546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,32,balanced,0.5554080009460449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,32,balanced,0.12531200051307678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,32,power_law_1.01,0.8373696327209472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,32,balanced,2.0227200190226235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,32,balanced,0.12822399536768594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,32,power_law_1.01,0.39404799938201907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,32,power_law_1.01,0.8870464324951172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,32,balanced,0.1323253313700358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,32,balanced,0.5292319854100546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,32,power_law_1.01,0.8682047843933105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,32,power_law_1.01,0.5548416137695312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,32,balanced,0.14544533689816794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,32,power_law_1.01,0.7505792140960693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,32,power_law_1.01,0.557747220993042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,32,power_law_1.01,0.8575551986694336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,32,power_law_1.01,0.17456640005111695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,32,balanced,1.054906686147054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,32,power_law_1.01,0.9565695762634278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,32,power_law_1.01,0.255948805809021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,32,power_law_1.2,0.6609663963317871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,32,balanced,0.15965867042541504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,32,power_law_1.01,0.3577791929244995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,32,power_law_1.01,1.0639871597290038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,32,balanced,2.87828795115153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,32,power_law_1.2,0.9580287933349609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,32,power_law_1.01,0.3558464050292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,32,power_law_1.01,1.2376511573791504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,32,power_law_1.2,0.7554111957550049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,32,power_law_1.01,0.0939520001411438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,32,power_law_1.01,0.40262398719787595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,32,power_law_1.01,1.521951961517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,32,balanced,0.9743573665618896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,32,power_law_1.2,0.28878719806671144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,32,power_law_1.01,0.44542717933654785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,32,power_law_1.01,0.11064319610595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,32,power_law_1.01,1.9131584167480469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,32,power_law_1.2,0.45937280654907225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,32,power_law_1.01,0.10607999563217163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,32,power_law_1.01,0.44788479804992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,32,power_law_1.01,2.2982719421386717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,32,balanced,0.183514674504598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,32,power_law_1.2,0.4916800022125244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,32,power_law_1.01,0.061267197132110596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,32,power_law_1.01,0.47881598472595216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,32,power_law_1.01,3.1531967163085937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,32,power_law_1.2,0.5611392021179199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,32,power_law_1.01,0.0752128005027771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,32,balanced,0.20357332626978555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,32,power_law_1.01,0.4584191799163818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,32,power_law_1.01,3.8522048950195313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,32,power_law_1.01,0.08351359963417053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,32,power_law_1.2,0.7181503772735596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,32,power_law_1.01,0.4657279968261719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,32,balanced,1.5228640238444011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,32,balanced,0.2405386765797933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,32,power_law_1.01,0.08280959725379944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,32,power_law_1.2,0.6901567935943603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,32,power_law_1.01,0.5035391807556152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,32,power_law_1.01,4.777920150756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,32,power_law_1.01,0.09810559749603272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,32,power_law_1.2,0.7251776218414306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,32,power_law_1.01,0.44841599464416504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,32,power_law_1.01,7.586752319335938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,32,power_law_1.01,0.10232959985733033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,32,power_law_1.2,0.7506303787231445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,32,power_law_1.01,0.502400016784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,32,power_law_1.01,0.10376960039138794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,32,power_law_1.2,0.8705216407775879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,32,balanced,4.12006409962972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,32,power_law_1.01,0.5056640148162842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,32,power_law_1.01,0.09870719909667969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,32,power_law_1.2,0.7766975879669189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,32,power_law_1.01,0.4755712032318115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,32,power_law_1.01,15.021139526367188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,32,power_law_1.01,0.11100159883499146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,32,power_law_1.2,0.7740352153778076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,32,power_law_1.01,0.47128958702087403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,32,balanced,0.29258666435877484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,32,balanced,2.053173383076986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,32,power_law_1.01,0.10857599973678589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,32,power_law_1.2,0.8528384208679199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,32,power_law_1.01,0.5946752071380615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,32,power_law_1.01,0.11962239742279053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,32,power_law_1.01,0.6421376228332519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,32,power_law_1.2,0.8404159545898438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,32,power_law_1.01,0.12991360425949097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,32,power_law_1.01,0.75283842086792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,32,power_law_1.2,0.8071935653686524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,32,balanced,0.3710506757100423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,32,power_law_1.01,0.14145920276641846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,32,power_law_1.2,0.928831958770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,32,power_law_1.01,0.9167615890502929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,32,power_law_1.01,0.15605759620666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,32,power_law_1.2,0.936518383026123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,32,power_law_1.01,1.1806591987609862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,32,power_law_1.01,0.18495999574661254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,32,power_law_1.2,1.0677824020385742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,32,power_law_1.01,1.5376959800720216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,32,power_law_1.2,1.202566432952881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,32,power_law_1.01,2.086886405944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,32,power_law_1.01,0.19824639558792115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,32,power_law_1.2,1.535257625579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,32,power_law_1.01,2.6404287338256838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,32,balanced,0.5035253365834554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,32,power_law_1.2,1.7527807235717774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,32,power_law_1.01,3.1375616073608397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,32,power_law_1.2,2.108083152770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,32,power_law_1.01,0.22634239196777345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,32,balanced,3.0636428197224936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,32,power_law_1.01,4.86308479309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,32,power_law_1.2,2.8859968185424805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,32,power_law_1.01,0.27639040946960447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,32,power_law_1.01,0.36639358997344973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,32,power_law_1.2,3.819916915893555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,32,power_law_1.01,9.840179443359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,32,balanced,0.6839040120442709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,32,power_law_1.2,4.735001754760742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,32,power_law_1.01,0.42696318626403806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,32,power_law_1.2,6.897357177734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,32,power_law_1.01,0.6463359832763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,32,power_law_1.2,10.995782470703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,32,power_law_1.01,0.8345088005065918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,32,balanced,6.980159759521484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,32,power_law_1.01,1.1498496055603027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,32,power_law_1.2,23.20668182373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,32,balanced,0.9296320279439291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,32,power_law_1.01,1.5223999977111817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,32,power_law_1.01,1.8584447860717774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,32,power_law_1.01,3.0721599578857424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,32,power_law_1.01,6.304940795898437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,32,balanced,1.144485314687093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,32,balanced,5.483909606933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,32,power_law_1.2,0.39121921062469484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,32,balanced,1.7722400029500325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,32,power_law_1.2,0.5577023983001709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,32,power_law_1.2,0.47148799896240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,32,power_law_1.2,0.17723519802093507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,32,power_law_1.2,0.22979838848114015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,32,power_law_1.2,0.3515199899673462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,32,power_law_1.2,0.32974720001220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,32,power_law_1.2,0.4346496105194092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,32,power_law_1.2,0.4792960166931152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,32,power_law_1.2,0.409222412109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,32,power_law_1.2,0.4132095813751221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,32,power_law_1.2,0.48657917976379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,32,power_law_1.2,0.43401598930358887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,32,power_law_1.2,0.4534143924713135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,32,power_law_1.2,0.4972224235534668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,32,power_law_1.2,0.46627202033996584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,32,power_law_1.2,0.4486656188964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,32,power_law_1.2,0.5293056011199951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,32,power_law_1.2,0.5188928127288819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,32,power_law_1.2,0.6272255897521972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,32,power_law_1.2,0.7438208103179932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,32,power_law_1.2,0.9278400421142579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,32,balanced,3.494842529296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,32,power_law_1.2,0.9892671585083008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,32,power_law_1.2,1.5087295532226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,32,power_law_1.2,1.741427230834961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,32,power_law_1.2,2.827289581298828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,32,power_law_1.2,3.3003841400146485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,32,power_law_1.2,0.09366400241851806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,32,power_law_1.2,3.9703041076660157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,32,power_law_1.2,0.11028480529785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,32,power_law_1.2,0.08909440040588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,32,power_law_1.2,6.568198394775391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,32,power_law_1.2,0.06818559765815735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,32,power_law_1.2,0.06776319742202759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,32,power_law_1.2,15.201132202148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,32,power_law_1.2,0.07722880244255066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,32,power_law_1.2,0.08921599984169007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,32,power_law_1.2,0.09985920190811157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,32,power_law_1.2,0.09923840165138245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,16,balanced,0.05653866628805796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,32,power_law_1.2,0.09809920191764832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,16,balanced,0.057461331288019814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,32,power_law_1.2,0.10729600191116333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,16,balanced,0.057909334699312844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,32,power_law_1.2,0.10862079858779908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,16,balanced,0.07019733389218648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,32,power_law_1.2,0.11662720441818238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,16,balanced,0.08731200297673543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,16,balanced,0.12870400150616965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,32,power_law_1.2,0.12222720384597778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,16,balanced,0.1713119943936666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,16,balanced,0.048058668772379555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,32,power_law_1.2,0.13414399623870848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,16,balanced,0.1686826745669047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,16,balanced,0.0495306650797526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,32,power_law_1.2,0.14485119581222533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,16,balanced,0.16953599452972412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,16,balanced,0.053946668903032936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,32,power_law_1.2,0.16012799739837646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,16,balanced,0.1702773372332255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,16,balanced,0.05772800246874491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,16,balanced,0.1673120061556498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,32,power_law_1.2,0.19866880178451538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,16,balanced,0.07060266534487407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,16,balanced,0.17453867197036743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,16,balanced,0.09220799803733826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,16,balanced,0.1803413430849711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,16,balanced,0.11537599563598633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,32,power_law_1.2,0.23233280181884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,16,balanced,0.1742239991823832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,16,balanced,0.11636799573898315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,16,balanced,0.18290666739145914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,16,balanced,0.04731733103593191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,16,balanced,0.11754666765530904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,16,balanced,0.1879253387451172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,32,power_law_1.2,0.2502079963684082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,16,balanced,0.1164479951063792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,16,balanced,0.04786666731039683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,16,power_law_1.01,0.09573119878768921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,16,balanced,0.18999467293421426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,16,balanced,0.04984533290068308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,32,power_law_1.2,0.33616640567779543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,16,balanced,0.11899733543395996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,16,power_law_1.01,0.12829439640045165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,16,balanced,0.05779199798901876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,16,balanced,0.19931199153264365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,16,balanced,0.12152000268300374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,32,power_law_1.2,0.43853440284729006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,16,power_law_1.01,0.16339839696884156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,16,balanced,0.07196266452471416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,16,balanced,0.12324266632397969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,16,balanced,0.21215466658274332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,16,balanced,0.09136533737182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,16,power_law_1.01,0.07466239929199218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,16,balanced,0.1255519986152649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,16,balanced,0.11746666828791301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,16,balanced,0.2325920065244039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,32,power_law_1.2,0.509280014038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,16,power_law_1.01,0.08401920199394226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,16,power_law_1.01,0.06974080204963684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,16,balanced,0.1323360006014506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,16,balanced,0.11798399686813354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,32,power_law_1.2,0.8278783798217774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,16,power_law_1.01,0.1061568021774292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,16,balanced,0.2584693431854248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,16,balanced,0.11885333061218262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,16,balanced,0.13449066877365112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,16,power_law_1.01,0.08944000005722046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,16,power_law_1.01,0.11584000587463379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,16,balanced,0.11943466464678447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,16,balanced,0.13958932956059775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,16,power_law_1.01,0.11088000535964966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,32,power_law_1.2,0.9045568466186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,16,balanced,0.2922826608022054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,16,balanced,0.12062399586041768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,16,power_law_1.01,0.13563519716262817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,16,power_law_1.01,0.06291840076446534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,16,balanced,0.1541706621646881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,32,power_law_1.2,1.4269887924194335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,16,balanced,0.1237546702226003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,16,power_law_1.01,0.14122240543365477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,16,power_law_1.01,0.0699072003364563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,16,balanced,0.1672053337097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,16,balanced,0.12532266974449158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,16,balanced,0.34169598420461017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,16,power_law_1.01,0.1407039999961853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,16,power_law_1.01,0.0821120023727417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,32,power_law_1.2,2.0093055725097657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,16,balanced,0.12788800398508707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,16,balanced,0.1930346687634786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,16,power_law_1.01,0.09127039909362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,16,power_law_1.01,0.1441215991973877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,16,balanced,0.13482133547465006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,32,power_law_1.2,2.6368896484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,16,power_law_1.01,0.09953280091285706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,16,power_law_1.01,0.15016319751739501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,16,balanced,0.3975413242975871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,16,balanced,0.2232266664505005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,16,balanced,0.1367573340733846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,16,power_law_1.01,0.10455039739608765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,16,power_law_1.01,0.1533504009246826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,32,power_law_1.2,3.7911808013916017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,16,balanced,0.14296533664067587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,16,power_law_1.01,0.10247039794921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,16,power_law_1.01,0.1656000018119812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,16,balanced,0.2728746732076009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,16,balanced,0.15919466813405356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,16,power_law_1.01,0.11032960414886475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,32,power_law_1.2,8.004013061523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,16,power_law_1.01,0.17672319412231446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,16,balanced,0.5176213184992472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,16,power_law_1.01,0.11157759428024291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,16,power_law_1.01,0.19753600358963014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,16,balanced,0.32124267021814984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,16,power_law_1.01,0.11493760347366333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,16,power_law_1.01,0.19215999841690062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,16,power_law_1.01,0.11923840045928955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,16,balanced,0.1774133245150248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,16,power_law_1.01,0.210099196434021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,16,power_law_1.01,0.12761600017547609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,16,balanced,0.40988266468048096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,16,power_law_1.01,0.23387520313262938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,16,power_law_1.01,0.13433599472045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,16,balanced,0.6528426806131998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,16,power_law_1.01,0.29023358821868894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,16,power_law_1.01,0.14369280338287355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,16,power_law_1.01,0.17193599939346313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,16,power_law_1.01,0.30680320262908933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,16,balanced,0.5393120050430298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,16,balanced,0.2050666610399882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,16,power_law_1.01,0.1814784049987793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,16,power_law_1.01,0.41139841079711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,16,power_law_1.01,0.22629759311676026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,16,balanced,0.2327679991722107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,16,power_law_1.01,0.435916805267334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,16,power_law_1.01,0.24865920543670655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,16,power_law_1.01,0.32268800735473635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,16,power_law_1.01,0.5435135841369629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,16,balanced,0.2843946615854899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,16,balanced,0.8658080101013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,16,power_law_1.01,0.39034879207611084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,16,balanced,0.7290933132171631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,16,power_law_1.01,0.7295743942260742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,16,power_law_1.01,0.49188480377197263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,16,power_law_1.01,0.9498496055603027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,16,power_law_1.01,0.651417589187622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,16,power_law_1.01,1.1366208076477051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,16,power_law_1.01,0.9191295623779296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,16,power_law_1.01,1.4512191772460938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,16,power_law_1.01,1.1884480476379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,16,power_law_1.01,2.256921577453613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,16,power_law_1.01,1.4722816467285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,16,balanced,0.36052266756693524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,16,power_law_1.01,4.246131134033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,16,balanced,0.9568640391031901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,16,power_law_1.01,2.2636608123779296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,16,balanced,1.0290239651997883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,16,power_law_1.01,4.512787246704102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,16,balanced,0.47785067558288574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,16,power_law_1.01,0.07246080040931702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,16,balanced,0.6499946514765421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,16,power_law_1.01,0.09388800263404846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,16,power_law_1.01,0.1177791953086853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,16,balanced,1.1620159943898518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,16,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,16,power_law_1.01,0.07097600102424621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,16,balanced,0.8770453135172526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,16,power_law_1.01,0.08303359746932984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,16,power_law_1.01,0.08811519742012024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,16,power_law_1.01,0.10641920566558838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,16,balanced,1.5835839907328289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,16,power_law_1.01,0.10620160102844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,16,power_law_1.2,0.09616640210151672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,16,power_law_1.01,0.10930559635162354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,16,power_law_1.01,0.11116160154342651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,16,power_law_1.2,0.12859519720077514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,16,power_law_1.01,0.11582080125808716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,16,power_law_1.2,0.09419519901275634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,16,power_law_1.01,0.12092159986495972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,16,power_law_1.2,0.07423999905586243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,16,power_law_1.01,0.12183040380477905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,16,balanced,1.1905866463979085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,16,balanced,1.8010187149047852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,16,power_law_1.2,0.08583040237426758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,16,power_law_1.01,0.1402624011039734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,16,power_law_1.2,0.10080000162124633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,16,power_law_1.01,0.147705602645874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,16,power_law_1.2,0.11059839725494384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,16,power_law_1.01,0.16576000452041625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,16,power_law_1.2,0.12695679664611817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,16,power_law_1.01,0.18844799995422362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,16,power_law_1.2,0.13560320138931276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,16,power_law_1.2,0.13176319599151612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,16,power_law_1.2,0.1399359941482544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,16,power_law_1.01,0.21511681079864503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,16,balanced,1.4678826332092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,16,power_law_1.2,0.1453760027885437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,16,power_law_1.2,0.1497599959373474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,16,power_law_1.01,0.24376320838928223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,16,power_law_1.2,0.15416959524154664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,16,power_law_1.2,0.16959359645843505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,16,power_law_1.01,0.30230400562286375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,16,power_law_1.2,0.1756160020828247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,16,power_law_1.01,0.3870271921157837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,16,power_law_1.2,0.19740159511566163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,16,power_law_1.2,0.21386239528656006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,16,power_law_1.01,0.5172160148620606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,16,power_law_1.2,0.24199039936065675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,16,power_law_1.2,0.2951872110366821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,16,power_law_1.01,0.6960256099700928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,16,balanced,2.932736078898112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,16,power_law_1.2,0.35041921138763427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,16,power_law_1.01,0.9060288429260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,16,power_law_1.2,0.4430272102355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,16,power_law_1.01,1.2961471557617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,16,power_law_1.2,0.4655168056488037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,16,balanced,2.2877279917399087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,16,power_law_1.2,0.657535982131958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,16,power_law_1.01,1.7658304214477538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,16,power_law_1.2,0.7785727977752686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,16,power_law_1.01,2.0690048217773436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,16,balanced,3.4536959330240884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,16,power_law_1.2,1.0476479530334473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,16,power_law_1.01,3.343577575683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,16,power_law_1.2,1.404742431640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,16,power_law_1.01,6.952025604248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,16,power_law_1.2,1.839731216430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,16,power_law_1.2,2.8311424255371094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,16,power_law_1.2,5.496518325805664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,16,power_law_1.2,0.06511359810829162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,16,power_law_1.2,0.09005439877510071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,16,power_law_1.2,0.0830847978591919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,16,power_law_1.2,0.06229760050773621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,16,power_law_1.2,0.0685696005821228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,16,power_law_1.2,0.07564799785614014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,16,power_law_1.2,0.08556159734725952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,16,power_law_1.2,0.0979200005531311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,16,power_law_1.2,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,16,power_law_1.2,0.1047104001045227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,16,power_law_1.2,0.10738559961318969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,16,power_law_1.2,0.11144959926605225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,16,power_law_1.2,0.11036800146102906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,16,balanced,4.499573389689128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,16,power_law_1.2,0.1164736032485962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,16,power_law_1.2,0.13283200263977052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,16,power_law_1.2,0.140447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,16,power_law_1.2,0.14954240322113038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,16,power_law_1.2,0.17082879543304444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,16,power_law_1.2,0.1828287959098816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,8,balanced,0.05691733459631602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,16,power_law_1.2,0.23413760662078859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,16,power_law_1.2,0.07365120053291321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,8,balanced,0.05610666672388712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,16,power_law_1.2,0.25804159641265867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,16,power_law_1.2,0.09304320216178893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,8,balanced,0.05996266504128774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,16,power_law_1.2,0.09217280149459839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,16,power_law_1.2,0.34686079025268557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,8,balanced,0.07175999879837036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,16,power_law_1.2,0.06236799955368042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,16,power_law_1.2,0.07081599831581116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,16,power_law_1.2,0.405625581741333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,8,balanced,0.08930133779843648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,16,power_law_1.2,0.08170239925384522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,8,balanced,0.13402133186658224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,16,power_law_1.2,0.570195198059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,16,power_law_1.2,0.08268160223960877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,8,balanced,0.178874671459198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,16,power_law_1.2,0.7188735961914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,16,power_law_1.2,0.0948415994644165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,8,balanced,0.1734666625658671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,16,power_law_1.2,0.10412160158157349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,16,power_law_1.2,1.01397762298584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,8,balanced,0.17363200585047403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,16,power_law_1.2,0.1027008056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,8,balanced,0.18150399128595987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,16,power_law_1.2,1.273151969909668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,16,power_law_1.2,0.11075199842453003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,8,balanced,0.17672000328699747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,16,power_law_1.2,0.11694719791412353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,16,power_law_1.2,1.7006080627441407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,16,power_law_1.2,0.121452796459198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,8,balanced,0.17916266123453775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,16,power_law_1.2,0.12591359615325928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,8,balanced,0.1812480092048645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,16,power_law_1.2,2.47640323638916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,16,power_law_1.2,0.13835519552230835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,8,balanced,0.1828320026397705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,16,power_law_1.2,0.14733439683914185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,8,balanced,0.18684266010920206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,16,power_law_1.2,5.561196899414062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,16,power_law_1.2,0.16758400201797485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,8,balanced,0.1981226603190104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,16,power_law_1.2,0.20923519134521484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,8,balanced,0.19839467604955038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,8,balanced,0.21662932634353638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,16,power_law_1.2,0.22980480194091796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,8,balanced,0.2270346681276957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,16,power_law_1.2,0.2773184061050415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,8,balanced,0.25202133258183795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,16,power_law_1.2,0.32690560817718506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,8,balanced,0.2860213319460551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,16,power_law_1.2,0.4585984230041504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,8,balanced,0.336298664410909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,16,power_law_1.2,0.5611392021179199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,16,power_law_1.2,0.8229951858520508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,8,balanced,0.3773813247680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,16,power_law_1.2,1.1043264389038085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,16,power_law_1.2,1.4506431579589845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,16,power_law_1.2,2.0112127304077148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,8,balanced,0.46351468563079834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,16,power_law_1.2,2.2657215118408205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,16,power_law_1.2,3.994303894042969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,8,balanced,0.602453351020813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,16,power_law_1.2,8.004338836669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,8,balanced,0.04860800007979075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,8,balanced,0.7874826590220133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,8,balanced,0.04933866858482361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,8,balanced,0.050986667474110924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,8,balanced,0.05874133110046387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,8,balanced,0.07253866891066234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,8,balanced,0.09942400455474854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,8,balanced,0.12558933099110922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,8,balanced,0.1260586678981781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,8,balanced,0.1269973317782084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,8,balanced,0.1274079978466034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,8,balanced,1.0530186494191487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,8,balanced,0.12987732887268066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,8,balanced,0.13181333740552267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,8,power_law_1.01,0.07049599885940552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,8,balanced,0.13332800070444742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,8,power_law_1.01,0.09301120042800903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,8,balanced,0.13537066181500754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,8,power_law_1.01,0.12524160146713256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,8,balanced,0.14552533626556396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,8,power_law_1.01,0.0711679995059967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,8,balanced,0.14813333749771118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,8,balanced,0.1544266641139984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,8,power_law_1.01,0.08442879915237426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,8,power_law_1.01,0.05676800012588501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,8,power_law_1.01,0.0976960003376007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,8,balanced,0.051167999704678856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,8,balanced,0.17100799083709717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,8,power_law_1.01,0.06670719981193543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,8,balanced,1.3553439776102703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,8,power_law_1.01,0.10872960090637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,8,balanced,0.054586668809254967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,8,power_law_1.01,0.0900223970413208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,8,balanced,0.18601600329081217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,8,power_law_1.01,0.13330559730529784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,8,balanced,0.05769599974155426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,8,power_law_1.01,0.06059520244598389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,8,balanced,0.21914666891098022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,8,power_law_1.01,0.13474559783935547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,8,balanced,0.0671253353357315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,8,power_law_1.01,0.06668800115585327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,8,power_law_1.01,0.14049279689788818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,8,balanced,0.08070933322111766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,8,balanced,0.25567466020584106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,8,power_law_1.01,0.08377599716186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,8,balanced,0.10446400443712871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,8,power_law_1.01,0.14620800018310548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,8,power_law_1.01,0.0871295988559723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,8,balanced,0.1325973371664683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,8,power_law_1.01,0.1545151948928833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,8,balanced,0.3062933286031087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,8,power_law_1.01,0.10264960527420045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,8,balanced,0.13343999783198038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,8,power_law_1.01,0.15996160507202148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,8,power_law_1.01,0.1045375943183899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,8,balanced,0.1357599993546804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,8,power_law_1.01,0.1666111946105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,8,balanced,0.3652533292770386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,8,power_law_1.01,0.10583679676055908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,8,balanced,0.13548266887664795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,8,power_law_1.01,0.18893439769744874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,8,balanced,0.13875733812650046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,8,power_law_1.01,0.10947200059890747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,8,power_law_1.01,0.1943616032600403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,8,balanced,0.14149333039919534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,8,power_law_1.01,0.11537920236587525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,8,power_law_1.01,0.1956287980079651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,8,balanced,0.4820266564687093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,8,balanced,0.14450666308403015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,8,balanced,1.913669268290202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,8,power_law_1.01,0.11993600130081176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,8,power_law_1.01,0.21689600944519044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,8,balanced,0.1474293371041616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,8,power_law_1.01,0.1269376039505005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,8,power_law_1.01,0.2506047964096069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,8,power_law_1.01,0.06692479848861695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,8,balanced,0.1562933325767517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,8,power_law_1.01,0.1384511947631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,8,power_law_1.01,0.29462399482727053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,8,balanced,0.15969600280125937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,8,power_law_1.01,0.08006399869918823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,8,balanced,0.6273333231608073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,8,power_law_1.01,0.1454975962638855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,8,power_law_1.01,0.32035839557647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,8,balanced,0.17094399531682333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,8,power_law_1.01,0.1076416015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,8,power_law_1.01,0.165011203289032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,8,power_law_1.01,0.41566081047058107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,8,balanced,0.19154665867487589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,8,power_law_1.01,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,8,power_law_1.01,0.18781440258026122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,8,power_law_1.01,0.4841599941253662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,8,power_law_1.01,0.07774720191955567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,8,power_law_1.01,0.20567679405212402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,8,power_law_1.01,0.08760960102081299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,8,power_law_1.01,0.6344895839691163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,8,power_law_1.01,0.24863998889923095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,8,balanced,0.8700533707936605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,8,power_law_1.01,0.09630720019340515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,8,power_law_1.01,0.8092608451843262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,8,power_law_1.01,0.27924480438232424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,8,balanced,0.2184213399887085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,8,power_law_1.01,0.11290880441665649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,8,power_law_1.01,0.3398080110549927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,8,power_law_1.01,1.0953280448913574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,8,power_law_1.01,0.11552000045776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,8,power_law_1.01,0.4251264095306396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,8,power_law_1.01,1.325817584991455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,8,power_law_1.01,0.1260159969329834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,8,power_law_1.01,0.5691199779510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,8,power_law_1.01,0.12480640411376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,8,power_law_1.01,1.597702407836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,8,power_law_1.01,0.7406784057617187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,8,power_law_1.01,0.12791039943695068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,8,power_law_1.01,2.4374656677246094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,8,balanced,0.2751786708831787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,8,balanced,1.137109359105428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,8,power_law_1.01,1.0501055717468262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,8,power_law_1.01,0.13546240329742432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,8,power_law_1.01,0.1460736036300659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,8,power_law_1.01,1.3390912055969237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,8,power_law_1.01,4.6617473602294925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,8,balanced,0.3258453408877055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,8,power_law_1.01,0.16341760158538818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,8,power_law_1.01,1.5814080238342285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,8,power_law_1.01,0.17446399927139283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,8,balanced,0.40722668170928955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,8,power_law_1.2,0.06845440268516541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,8,power_law_1.01,2.465785598754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,8,power_law_1.01,0.1925055980682373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,8,power_law_1.2,0.08134400248527526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,8,power_law_1.01,0.22906239032745362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,8,power_law_1.01,5.023353576660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,8,power_law_1.2,0.07368959784507752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,8,power_law_1.2,0.06936960220336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,8,balanced,1.4271039962768555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,8,balanced,3.6209119160970054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,8,balanced,0.5249013503392538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,8,power_law_1.01,0.26965761184692383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,8,power_law_1.2,0.08391680121421814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,8,power_law_1.2,0.09563519954681396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,8,power_law_1.01,0.3308288097381592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,8,power_law_1.2,0.11456639766693115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,8,balanced,0.6899840037027994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,8,power_law_1.2,0.12847360372543334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,8,power_law_1.01,0.3858943939208984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,8,power_law_1.2,0.1338688015937805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,8,power_law_1.01,0.5172095775604248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,8,power_law_1.2,0.13397120237350463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,8,balanced,0.9498879909515381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,8,power_law_1.01,0.6880767822265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,8,power_law_1.2,0.1459328055381775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,8,power_law_1.01,0.9133695602416992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,8,power_law_1.2,0.1529855966567993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,8,power_law_1.01,1.2026752471923827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,8,power_law_1.2,0.15631359815597534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,8,power_law_1.2,0.17304320335388185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,8,balanced,2.163263956705729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,8,power_law_1.01,1.7635391235351563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,8,power_law_1.2,0.18525439500808716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,8,balanced,1.2941280206044514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,8,power_law_1.01,2.2720703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,8,power_law_1.2,0.19491200447082518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,8,power_law_1.01,2.672889518737793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,8,power_law_1.2,0.05687040090560913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,8,power_law_1.2,0.20157439708709718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,8,power_law_1.2,0.23206400871276855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,8,power_law_1.2,0.06677759885787964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,8,power_law_1.01,4.386771011352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,8,power_law_1.2,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,8,power_law_1.2,0.25156478881835936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,8,power_law_1.2,0.05973119735717773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,8,power_law_1.2,0.31001598834991456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,8,power_law_1.01,8.848076629638673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,8,power_law_1.2,0.0645695984363556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,8,power_law_1.2,0.3341759920120239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,8,power_law_1.2,0.07912960052490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,8,balanced,1.7255412737528484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,8,power_law_1.2,0.41906561851501467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,8,power_law_1.2,0.08325120210647582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,8,power_law_1.2,0.10030080080032348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,8,power_law_1.2,0.540064001083374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,8,power_law_1.2,0.1022271990776062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,8,power_law_1.2,0.10311679840087891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,8,power_law_1.2,0.6984447956085205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,8,power_law_1.2,0.11314560174942016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,8,power_law_1.2,0.8199295997619629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,8,power_law_1.2,0.11700479984283448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,8,power_law_1.2,1.23306884765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,8,power_law_1.2,0.11998720169067383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,8,power_law_1.2,0.12540800571441652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,8,power_law_1.2,1.3862144470214843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,8,power_law_1.2,0.13741439580917358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,8,power_law_1.2,0.14588160514831544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,8,balanced,2.1394294102986655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,8,power_law_1.2,1.8008256912231446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,8,power_law_1.2,0.16174720525741576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,8,power_law_1.2,2.775961685180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,8,power_law_1.2,0.19511040449142455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,8,power_law_1.2,0.2146239995956421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,8,power_law_1.2,0.26083199977874755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,8,power_law_1.2,5.539257431030274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,8,power_law_1.2,0.27781119346618655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,8,power_law_1.2,0.3594944000244141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,8,balanced,4.119301478068034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,8,power_law_1.2,0.45045762062072753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,8,power_law_1.2,0.5788479804992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,8,power_law_1.2,0.8209535598754882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,8,power_law_1.2,1.1993791580200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,8,power_law_1.2,1.4709376335144042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,8,power_law_1.2,1.8012800216674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,8,balanced,3.343040148417155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,8,power_law_1.2,2.953785514831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,8,power_law_1.2,6.1643329620361325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,8,power_law_1.2,0.06744319796562195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,8,balanced,6.566901524861653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,8,power_law_1.2,0.08147839903831482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,8,power_law_1.2,0.07124480009078979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,8,power_law_1.2,0.07100160121917724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,8,power_law_1.2,0.07648640275001525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,4,balanced,0.05611200133959452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,4,balanced,0.048885335524876915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,8,power_law_1.2,0.09009919762611389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,4,balanced,0.05797333518664042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,8,power_law_1.2,0.09326080083847046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,4,balanced,0.050981332858403526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,4,balanced,0.06205866734186808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,4,balanced,0.07565866907437642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,8,power_law_1.2,0.1087231993675232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,4,balanced,0.053599998354911804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,4,balanced,0.09681066870689392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,4,balanced,0.14689600467681885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,4,balanced,0.06517866750558217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,8,power_law_1.2,0.11138559579849243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,4,balanced,0.198634664217631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,4,balanced,0.0825386643409729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,4,balanced,0.19356266657511392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,8,power_law_1.2,0.11641600131988525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,4,balanced,0.19244267543156943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,4,balanced,0.1156213382879893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,8,power_law_1.2,0.12628480195999145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,4,balanced,0.20407466093699136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,4,balanced,0.15034133195877075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,4,balanced,0.19570666551589966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,8,power_law_1.2,0.1341312050819397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,4,balanced,0.14898133277893066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,4,balanced,0.20211732387542725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,4,balanced,0.2116746703783671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,4,balanced,0.15081600348154703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,8,power_law_1.2,0.13526400327682495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,4,balanced,0.21073599656422934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,4,balanced,0.15178666512171426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,8,power_law_1.2,0.14716800451278686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,4,balanced,0.21805334091186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,4,balanced,0.1551040013631185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,8,power_law_1.2,0.16380800008773805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,4,balanced,0.22469866275787354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,4,balanced,0.15794666608174643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,4,balanced,0.16080000003178915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,8,power_law_1.2,0.16939519643783568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,4,balanced,0.21855467557907104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,4,balanced,0.1632213294506073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,4,balanced,0.24109333753585815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,8,power_law_1.2,0.1930176019668579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,4,balanced,0.17195733388264975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,4,balanced,0.25760533412297565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,8,power_law_1.2,0.2410111904144287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,4,balanced,0.17572800318400064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,4,balanced,0.2895359992980957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,4,balanced,0.1865760087966919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,4,balanced,0.33987732728322345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,8,power_law_1.2,0.2718400001525879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,4,balanced,0.2055786649386088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,4,balanced,0.3957759936650594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,4,balanced,0.22838934262593588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,8,power_law_1.2,0.34849278926849364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,4,balanced,0.2738879919052124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,4,balanced,0.4745279947916667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,8,power_law_1.2,0.42211198806762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,4,balanced,0.31674132744471234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,8,power_law_1.2,0.5835072040557862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,4,balanced,0.06683200101057689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,4,balanced,0.07037866612275441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,4,balanced,0.6145973205566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,8,power_law_1.2,0.7448063850402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,4,balanced,0.38388800621032715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,4,balanced,0.07452266911665599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,4,balanced,0.08687999844551086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,8,power_law_1.2,1.0228799819946288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,4,balanced,0.10259733597437541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,4,balanced,0.13424533605575562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,4,balanced,0.47049065430959064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,8,power_law_1.2,1.4393728256225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,4,balanced,0.16936000188191733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,4,balanced,0.7917760213216146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,4,balanced,0.17073599497477213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,8,power_law_1.2,1.8989952087402344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,4,balanced,0.17417067289352417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,4,balanced,0.17720532417297363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,4,balanced,0.634879986445109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,8,power_law_1.2,2.386892890930176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,4,balanced,0.1793760061264038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,8,power_law_1.2,3.044595146179199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,4,balanced,0.18543465932210287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,4,power_law_1.01,0.05149440169334411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,4,balanced,1.0884693463643391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,4,balanced,0.18940800428390503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,4,power_law_1.01,0.060083198547363284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,8,power_law_1.2,4.954444885253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,4,power_law_1.01,0.061926400661468504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,4,balanced,0.19741332530975342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,4,balanced,0.8255253632863363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,4,balanced,0.20932267109553018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,4,power_law_1.01,0.07550719976425171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,4,power_law_1.01,0.07463039755821228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,4,balanced,0.21573332945505777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,8,power_law_1.2,10.288966369628906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,4,power_law_1.01,0.08996480107307434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,4,power_law_1.01,0.062431997060775755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,4,balanced,0.2326293389002482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,4,power_law_1.01,0.06977919936180114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,4,power_law_1.01,0.0763584017753601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,4,balanced,0.2600319981575012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,4,power_law_1.01,0.09249920248985291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,4,power_law_1.01,0.08278399705886841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,4,balanced,1.4272799491882324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,4,balanced,1.1674773693084717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,4,power_law_1.01,0.09775360226631165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,4,power_law_1.01,0.10601600408554077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,4,power_law_1.01,0.1134335994720459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,4,power_law_1.01,0.12227840423583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,4,power_law_1.01,0.07429760098457336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,4,power_law_1.01,0.12239359617233277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,4,power_law_1.01,0.1422719955444336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,4,balanced,0.3189866741498311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,4,power_law_1.01,0.08209919929504395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,4,power_law_1.01,0.12042239904403687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,4,power_law_1.01,0.1466048002243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,4,power_law_1.01,0.10120960474014282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,4,power_law_1.01,0.1333631992340088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,4,power_law_1.01,0.14967679977416992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,4,power_law_1.01,0.08556159734725952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,4,power_law_1.01,0.13946239948272704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,4,power_law_1.01,0.15453439950942993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,4,balanced,1.5056692759195964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,4,power_law_1.01,0.09843199849128723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,4,power_law_1.01,0.1451840043067932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,4,power_law_1.01,0.16970880031585694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,4,balanced,1.7671200434366863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,4,balanced,0.42795733610788983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,4,power_law_1.01,0.11216000318527222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,4,power_law_1.01,0.15306240320205688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,4,power_law_1.01,0.16787840127944947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,4,power_law_1.01,0.12238719463348388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,4,balanced,0.5059626499811808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,4,power_law_1.01,0.1850559949874878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,4,power_law_1.01,0.16261119842529298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,4,power_law_1.01,0.1404031991958618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,4,power_law_1.01,0.19841920137405394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,4,power_law_1.01,0.17331839799880983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,4,power_law_1.01,0.14300160408020018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,4,balanced,0.625162680943807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,4,power_law_1.01,0.17662719488143921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,4,power_law_1.01,0.2247231960296631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,4,power_law_1.01,0.15500799417495728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,4,power_law_1.01,0.21185920238494874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,4,power_law_1.01,0.22449278831481934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,4,power_law_1.01,0.15550719499588012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,4,balanced,0.8281333446502686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,4,power_law_1.01,0.24970240592956544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,4,power_law_1.01,0.25109119415283204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,4,power_law_1.01,0.1714687943458557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,4,balanced,1.8616906801859539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,4,power_law_1.01,0.3022527933120728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,4,power_law_1.01,0.306604790687561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,4,power_law_1.01,0.17894400358200074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,4,power_law_1.01,0.33923840522766113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,4,balanced,1.0880266825358074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,4,power_law_1.01,0.3527359962463379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,4,power_law_1.01,0.1940160036087036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,4,power_law_1.01,0.4252352237701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,4,power_law_1.01,0.3904639959335327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,4,power_law_1.01,0.20919039249420165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,4,power_law_1.01,0.5394752025604248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,4,power_law_1.01,0.21971840858459474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,4,power_law_1.01,0.47151360511779783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,4,power_law_1.01,0.7093376159667969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,4,balanced,2.685786565144857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,4,power_law_1.01,0.2540607929229736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,4,balanced,1.5228373209635417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,4,power_law_1.01,0.5164095878601074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,4,power_law_1.01,0.8849151611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,4,power_law_1.01,0.324780797958374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,4,power_law_1.01,0.6963583946228027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,4,power_law_1.01,1.2652095794677733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,4,power_law_1.01,0.8817472457885742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,4,power_law_1.01,1.6694463729858398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,4,power_law_1.01,0.3800575971603394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,4,power_law_1.01,1.2065216064453126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,4,power_law_1.01,1.982694435119629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,4,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,4,power_law_1.01,1.641708755493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,4,balanced,2.079253355662028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,4,power_law_1.01,3.247737503051758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,4,power_law_1.01,0.4611392021179199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,4,power_law_1.2,0.07600640058517456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,4,balanced,2.887141227722168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,4,power_law_1.01,1.9663808822631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,4,power_law_1.01,0.5568640232086182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,4,power_law_1.2,0.06444799900054932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,4,power_law_1.01,6.456883239746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,4,power_law_1.01,2.9781824111938477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,4,power_law_1.01,0.7512447834014893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,4,power_law_1.2,0.07180160284042358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,4,power_law_1.2,0.08483200073242188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,4,power_law_1.01,0.9724479675292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,4,power_law_1.01,5.5746112823486325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,4,power_law_1.2,0.10528000593185424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,4,power_law_1.01,1.3392895698547362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,4,power_law_1.2,0.1096127986907959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,4,power_law_1.01,1.7207487106323243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,4,balanced,2.8178399403889975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,4,power_law_1.2,0.13583999872207642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,4,power_law_1.01,2.457209587097168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,4,power_law_1.2,0.1413823962211609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,4,power_law_1.01,3.132595252990723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,4,power_law_1.2,0.14892159700393676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,4,power_law_1.2,0.15751680135726928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,4,power_law_1.01,4.010956954956055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,4,power_law_1.2,0.1665984034538269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,4,power_law_1.01,6.360902404785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,4,power_law_1.2,0.17307519912719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,4,power_law_1.2,0.18935680389404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,4,power_law_1.01,12.035526275634766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,4,power_law_1.2,0.20570240020751954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,4,balanced,3.492645263671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,4,power_law_1.2,0.2212671995162964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,4,balanced,5.01421324412028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,4,power_law_1.2,0.22315518856048583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,4,power_law_1.2,0.25691521167755127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,4,power_law_1.2,0.30919039249420166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,4,power_law_1.2,0.369158411026001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,4,power_law_1.2,0.40447359085083007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,4,power_law_1.2,0.500057601928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,4,power_law_1.2,0.5782336235046387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,4,balanced,5.510245641072591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,4,power_law_1.2,0.8059967994689942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,4,power_law_1.2,0.9328512191772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,4,balanced,5.459317525227864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,4,power_law_1.2,1.3204031944274903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,4,power_law_1.2,1.8114879608154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,4,power_law_1.2,2.1835840225219725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,4,power_law_1.2,3.460313415527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,4,power_law_1.2,7.114227294921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,4,power_law_1.2,0.051507198810577394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,4,power_law_1.2,0.06216959953308106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,4,power_law_1.2,0.05788800120353699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,4,power_law_1.2,0.0616703987121582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,4,power_law_1.2,0.07354879975318909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,4,power_law_1.2,0.08465279936790467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,4,power_law_1.2,0.09219840168952942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,4,power_law_1.2,0.10650880336761474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,4,power_law_1.2,0.11701760292053223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,4,power_law_1.2,0.11749759912490845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,4,balanced,10.717829386393229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,4,power_law_1.2,0.12996480464935303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,4,power_law_1.2,0.13980159759521485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,4,power_law_1.2,0.14711040258407593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,4,power_law_1.2,0.15135999917984008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,4,power_law_1.2,0.1668544054031372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,4,power_law_1.2,0.17280639410018922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,4,power_law_1.2,0.18099199533462523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,4,power_law_1.2,0.21704320907592772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,4,power_law_1.2,0.2518464088439941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,4,power_law_1.2,0.31346559524536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,4,power_law_1.2,0.35136640071868896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,4,power_law_1.2,0.43893117904663087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,4,power_law_1.2,0.5683584213256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,4,power_law_1.2,0.733523178100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,4,power_law_1.2,0.9517056465148925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,4,power_law_1.2,1.4353599548339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,4,power_law_1.2,1.8449983596801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,4,power_law_1.2,2.2062847137451174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,4,power_law_1.2,3.4391807556152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,2,balanced,0.0590826670328776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,4,power_law_1.2,6.902252960205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,2,balanced,0.06192000210285187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,2,balanced,0.07039999961853027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,4,power_law_1.2,0.0744383990764618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,2,balanced,0.08799466490745544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,2,balanced,0.12616533041000366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,4,power_law_1.2,0.08213120102882385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,2,balanced,0.1810986598332723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,4,power_law_1.2,0.0809664011001587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,2,balanced,0.2390026648839315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,4,power_law_1.2,0.08705919981002808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,2,balanced,0.22738132874170938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,4,power_law_1.2,0.0959231972694397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,2,balanced,0.22931732734044394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,4,power_law_1.2,0.1096384048461914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,2,balanced,0.22678399085998535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,4,power_law_1.2,0.12013440132141114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,2,balanced,0.2328746716181437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,2,balanced,0.0528053343296051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,2,balanced,0.23595199982325235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,4,power_law_1.2,0.13393919467926024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,2,balanced,0.2383093237876892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,2,balanced,0.05639466643333435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,4,power_law_1.2,0.13824000358581542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,2,balanced,0.06477866570154826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,2,balanced,0.24456000328063965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,4,power_law_1.2,0.1450943946838379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,2,balanced,0.07932800054550171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,2,balanced,0.2554080088933309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,4,power_law_1.2,0.15233919620513917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,2,balanced,0.10910933216412862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,2,balanced,0.25832533836364746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,2,balanced,0.15715733170509338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,4,power_law_1.2,0.1716096043586731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,2,balanced,0.268885334332784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,2,balanced,0.20892266432444254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,4,power_law_1.2,0.17662080526351928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,2,balanced,0.21158399184544882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,2,balanced,0.29958399136861164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,4,power_law_1.2,0.19881600141525269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,2,balanced,0.21364800135294595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,2,balanced,0.32678399483362836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,2,balanced,0.21520533164342245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,4,power_law_1.2,0.20908160209655763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,2,power_law_1.01,0.05850239992141724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,2,balanced,0.21754666169484457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,2,balanced,0.38165334860483807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,4,power_law_1.2,0.2219327926635742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,2,power_law_1.01,0.07356799840927124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,2,balanced,0.22168533007303873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,4,power_law_1.2,0.2566976070404053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,2,balanced,0.4604959885279338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,2,balanced,0.22500799099604288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,2,power_law_1.01,0.08460800051689148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,4,power_law_1.2,0.321561598777771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,2,balanced,0.2297439972559611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,2,power_law_1.01,0.07809919714927674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,2,balanced,0.5502719879150391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,2,balanced,0.23540266354878744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,2,power_law_1.01,0.10780160427093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,2,balanced,0.247871994972229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,4,power_law_1.2,0.3881279945373535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,2,power_law_1.01,0.1331007957458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,2,balanced,0.26048000653584796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,2,balanced,0.6809386412302653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,2,power_law_1.01,0.1479423999786377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,2,balanced,0.29068267345428467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,2,power_law_1.01,0.16726399660110475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,4,power_law_1.2,0.5028416156768799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,2,balanced,0.3301493326822917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,2,balanced,0.9246133168538412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,2,power_law_1.01,0.17102080583572388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,4,power_law_1.2,0.5652736186981201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,2,balanced,0.38330666224161786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,2,power_law_1.01,0.17816319465637206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,4,power_law_1.2,0.7543871879577637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,2,power_law_1.01,0.1847551941871643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,2,balanced,0.4529759883880615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,4,power_law_1.2,1.0256959915161132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,2,power_law_1.01,0.052153599262237546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,2,power_law_1.01,0.19503999948501588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,4,power_law_1.2,1.3196352005004883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,2,balanced,1.2360320091247559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,2,balanced,0.5468746821085612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,2,power_law_1.01,0.20279040336608886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,2,power_law_1.01,0.05793280005455017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,4,power_law_1.2,1.880998420715332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,2,power_law_1.01,0.22013440132141113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,2,power_law_1.01,0.07318400144577027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,4,power_law_1.2,2.7283775329589846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,2,power_law_1.01,0.2326335906982422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,2,balanced,0.6809013684590658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,2,power_law_1.01,0.0753279983997345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,4,power_law_1.2,3.4946369171142577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,2,power_law_1.01,0.2464063882827759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,2,power_law_1.01,0.09036160111427308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,2,balanced,1.7116692860921223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,2,power_law_1.01,0.2624768018722534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,4,power_law_1.2,4.626188659667969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,2,balanced,0.9446400006612142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,2,power_law_1.01,0.11393920183181763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,2,power_law_1.01,0.31032960414886473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,4,power_law_1.2,6.680083465576172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,2,power_law_1.01,0.12584320306777955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,2,power_law_1.01,0.33860480785369873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,2,power_law_1.01,0.15175039768218995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,2,power_law_1.01,0.46109437942504883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,4,power_law_1.2,14.31700439453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,2,power_law_1.01,0.4683839797973633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,2,balanced,1.2504106362660725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,2,power_law_1.01,0.1575103998184204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,2,power_law_1.01,0.6142208099365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,2,power_law_1.01,0.16696319580078126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,2,balanced,2.1916747093200684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,2,power_law_1.01,0.7393152236938476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,2,power_law_1.01,0.17579519748687744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,2,power_law_1.01,0.9964351654052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,2,power_law_1.01,0.18279039859771729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,2,power_law_1.01,1.2758527755737306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,2,power_law_1.01,0.19173760414123536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,2,balanced,1.7846986452738445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,2,power_law_1.01,0.20698881149291992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,2,power_law_1.01,1.8395135879516602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,2,power_law_1.01,0.22673919200897216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,2,power_law_1.01,2.3847360610961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,2,power_law_1.01,0.24051198959350586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,2,power_law_1.01,2.7516672134399416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,2,balanced,2.718085289001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,2,power_law_1.01,0.25082879066467284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,2,power_law_1.01,4.528480148315429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,2,power_law_1.01,0.301363205909729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,2,balanced,2.3032213846842446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,2,power_law_1.01,0.3422399997711182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,2,power_law_1.01,9.188633728027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,2,power_law_1.01,0.4449151992797852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,2,power_law_1.01,0.4756671905517578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,2,power_law_1.01,0.6103936195373535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,2,power_law_1.01,0.7379776000976562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,2,power_law_1.01,0.9983679771423339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,2,balanced,2.880202611287435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,2,power_law_1.01,1.3015168190002442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,2,power_law_1.01,1.7846527099609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,2,balanced,4.189413388570149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,2,power_law_1.01,2.4348543167114256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,2,power_law_1.01,2.879680061340332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,2,power_law_1.01,4.620038223266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,2,power_law_1.01,9.157305908203124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,2,power_law_1.2,0.05878400206565857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,2,power_law_1.2,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,2,power_law_1.2,0.07541120052337646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,2,balanced,4.452426592508952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,2,power_law_1.2,0.08053759932518005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,2,power_law_1.2,0.10529919862747192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,2,power_law_1.2,0.122707200050354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,2,power_law_1.2,0.13445119857788085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,2,power_law_1.2,0.16053119897842408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,2,power_law_1.2,0.1686911940574646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,2,power_law_1.2,0.17751679420471192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,2,power_law_1.2,0.1861248016357422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,2,power_law_1.2,0.1929152011871338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,2,power_law_1.2,0.2029695987701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,2,power_law_1.2,0.2171328067779541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,2,power_law_1.2,0.23248639106750488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,2,balanced,7.844730377197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,2,power_law_1.2,0.2489856004714966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,2,power_law_1.2,0.27435519695281985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,2,power_law_1.2,0.3229055881500244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,2,power_law_1.2,0.3529983997344971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,2,power_law_1.2,0.4731776237487793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,2,power_law_1.2,0.533516788482666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,2,power_law_1.2,0.6728384017944335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,2,balanced,8.44807497660319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,2,power_law_1.2,0.8210816383361816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,2,power_law_1.2,1.0267583847045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,2,power_law_1.2,1.3314240455627442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,2,power_law_1.2,1.9267391204833983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,2,power_law_1.2,2.4046335220336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,2,power_law_1.2,0.05195519924163818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,2,power_law_1.2,2.9664064407348634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,2,power_law_1.2,0.05806080102920532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,2,power_law_1.2,4.635456085205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,2,power_law_1.2,0.06446080207824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,2,power_law_1.2,0.07362560033798218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,2,power_law_1.2,8.868876647949218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,2,power_law_1.2,0.08632320165634155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,2,power_law_1.2,0.1092352032661438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,2,power_law_1.2,0.1158784031867981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,2,power_law_1.2,0.14832639694213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,2,power_law_1.2,0.15022720098495485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,2,power_law_1.2,0.16062719821929933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,64,balanced,0.056133334835370384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,2,power_law_1.2,0.1677183985710144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,64,balanced,0.056746666630109154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,2,power_law_1.2,0.184607994556427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,64,balanced,0.056176001826922096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,2,power_law_1.2,0.19360640048980712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,64,balanced,0.053818667928377785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,2,power_law_1.2,0.20647039413452148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,64,balanced,0.05871466795603434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,64,balanced,0.07451733450094859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,2,power_law_1.2,0.22415359020233155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,64,power_law_1.01,0.06748160123825073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,64,balanced,0.08011733492215474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,2,power_law_1.2,0.24015359878540038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,64,balanced,0.08667199810345967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,64,power_law_1.01,0.05792639851570129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,2,power_law_1.2,0.25471360683441163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,64,balanced,0.09366933504740398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,64,power_law_1.01,0.057081598043441775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,64,balanced,0.09544000029563904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,2,power_law_1.2,0.3039103984832764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,64,power_law_1.01,0.054079997539520266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,64,balanced,0.09277333815892537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,64,power_law_1.01,0.05982720255851746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,2,power_law_1.2,0.3534784078598022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,64,balanced,0.09019200007120769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,64,power_law_1.01,0.0705344021320343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,2,power_law_1.2,0.4453887939453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,64,power_law_1.01,0.07838720083236694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,64,balanced,0.09175466497739156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,64,power_law_1.01,0.07654399871826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,2,power_law_1.2,0.4990975856781006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,64,balanced,0.0920906662940979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,64,power_law_1.01,0.08663039803504943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,64,balanced,0.0899733304977417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,2,power_law_1.2,0.6402880191802979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,64,power_law_1.01,0.08783360123634339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,64,power_law_1.2,0.06746240258216858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,64,balanced,0.0890826682249705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,64,power_law_1.01,0.08775039911270141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,2,power_law_1.2,0.7492800235748291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,64,power_law_1.2,0.0574720025062561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,64,power_law_1.01,0.08702080249786377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,64,balanced,0.09276800354321797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,64,power_law_1.01,0.08831999897956848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,2,power_law_1.2,1.0241984367370605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,64,power_law_1.2,0.055904000997543335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,64,balanced,0.09582933783531189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,64,power_law_1.01,0.08912640213966369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,64,power_law_1.2,0.05390080213546753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,2,power_law_1.2,1.3405119895935058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,64,power_law_1.01,0.08821759819984436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,64,balanced,0.09898133079210918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,64,power_law_1.2,0.05818880200386047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,64,power_law_1.01,0.08988800048828124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,2,power_law_1.2,1.9416383743286132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,64,balanced,0.10813333590825398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,64,power_law_1.01,0.09267839789390564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,64,power_law_1.2,0.06874880194664001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,64,power_law_1.01,0.10561920404434204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,64,balanced,0.11545600493748982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,2,power_law_1.2,2.4577472686767576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,64,power_law_1.01,0.1215999960899353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,64,power_law_1.2,0.08196480274200439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,64,power_law_1.01,0.13006720542907715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,64,power_law_1.2,0.0808896005153656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,64,balanced,0.13487466176350912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,2,power_law_1.2,3.0689664840698243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,64,power_law_1.01,0.1511423945426941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,64,power_law_1.2,0.08952320218086243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,64,power_law_1.01,0.23082239627838136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,64,balanced,0.15380799770355225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,2,power_law_1.2,4.910911941528321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,64,power_law_1.2,0.09016960263252258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,64,power_law_1.01,0.29119999408721925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,64,power_law_1.01,0.4077184200286865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,64,power_law_1.2,0.0902463972568512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,64,power_law_1.01,0.5820799827575683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,64,power_law_1.2,0.0925055980682373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,64,balanced,0.21489065885543823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,2,power_law_1.2,10.647551727294921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,64,power_law_1.01,0.7398015975952148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,64,power_law_1.2,0.08954240083694458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,64,power_law_1.01,1.0889727592468261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,64,power_law_1.2,0.08925439715385437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,64,power_law_1.01,1.4416704177856445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,64,balanced,0.2565760016441345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,64,power_law_1.2,0.0926912009716034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,64,power_law_1.01,2.3191999435424804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,64,power_law_1.2,0.09292799830436707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,64,power_law_1.01,4.571404647827149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,64,power_law_1.2,0.11175040006637574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,64,balanced,0.3760480086008708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,64,power_law_1.2,0.11477760076522828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,64,power_law_1.2,0.13715200424194335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,64,power_law_1.2,0.1667904019355774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,32,balanced,0.04784533381462097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,64,power_law_1.2,0.2169408082962036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,64,balanced,0.4867200056711833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,32,balanced,0.04851733148097992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,64,power_law_1.2,0.2959552049636841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,32,balanced,0.04910400013128916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,64,power_law_1.2,0.3775552034378052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,32,balanced,0.04747200012207031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,32,balanced,0.05067199965318044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,64,power_law_1.2,0.5481408119201661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,32,balanced,0.056048000852266945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,64,balanced,0.6013546784718832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,32,balanced,0.06381333371003468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,64,power_law_1.2,0.7373504161834716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,32,power_law_1.01,0.06997759938240052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,32,balanced,0.06530666848023732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,64,power_law_1.2,1.2168000221252442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,32,power_law_1.01,0.06064640283584595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,32,balanced,0.07308266560236613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,64,power_law_1.2,1.5352704048156738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,32,power_law_1.01,0.050406402349472045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,32,balanced,0.07504533231258392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,64,power_law_1.2,2.507084846496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,32,balanced,0.07702399790287018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,32,power_law_1.01,0.0472896009683609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,32,balanced,0.07459733386834462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,64,power_law_1.2,3.3548862457275392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,32,power_law_1.01,0.050361597537994386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,32,balanced,0.07387733459472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,32,power_law_1.01,0.05514240264892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,64,balanced,0.9445280234018961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,32,balanced,0.07287999987602234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,64,power_law_1.2,9.58115234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,32,power_law_1.01,0.06250240206718445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,32,balanced,0.07422400017579396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,32,power_law_1.01,0.0636031985282898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,32,balanced,0.07380799949169159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,32,power_law_1.01,0.07616639733314515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,32,balanced,0.07713599999745686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,32,power_law_1.01,0.08366720080375671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,32,balanced,0.08061866462230682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,32,power_law_1.01,0.0749888002872467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,32,balanced,0.08365866541862488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,32,power_law_1.01,0.07712000012397766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,32,balanced,0.09156800309816997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,32,power_law_1.2,0.07011200189590454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,32,power_law_1.01,0.08174719810485839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,32,balanced,0.09801066915194194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,32,power_law_1.01,0.08144639730453491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,32,power_law_1.2,0.06090239882469177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,32,power_law_1.01,0.07262719869613647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,32,power_law_1.2,0.05097600221633911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,32,balanced,0.11479999621709187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,32,power_law_1.01,0.07502080202102661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,32,power_law_1.2,0.04952319860458374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,64,balanced,1.8640693028767903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,32,balanced,0.13481600085894266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,32,power_law_1.01,0.08305280208587647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,32,power_law_1.2,0.05065600275993347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,32,power_law_1.01,0.0837440013885498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,32,power_law_1.2,0.05480960011482239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,32,power_law_1.01,0.11706880331039429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,32,balanced,0.20874667167663574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,32,power_law_1.2,0.06306560039520263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,32,power_law_1.01,0.12468479871749878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,32,power_law_1.2,0.06370559930801392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,32,power_law_1.01,0.14213119745254515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,32,balanced,0.24750399589538574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,32,power_law_1.2,0.07896959781646729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,32,power_law_1.01,0.19377919435501098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,32,power_law_1.2,0.07592960000038147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,32,power_law_1.01,0.2207103967666626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,32,power_law_1.2,0.07992320060729981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,32,power_law_1.01,0.32660479545593263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,32,balanced,0.35786668459574383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,32,power_law_1.2,0.07678719758987426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,32,power_law_1.01,0.45098237991333007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,32,power_law_1.2,0.07811840176582337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,32,power_law_1.01,0.6245503902435303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,32,power_law_1.2,0.07495679855346679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,32,power_law_1.01,0.7568384170532226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,16,balanced,0.033376000821590424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,32,power_law_1.2,0.08113279938697815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,32,balanced,0.46481064955393475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,32,power_law_1.01,1.075692844390869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,32,power_law_1.2,0.07583360075950622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,16,balanced,0.035173334181308746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,32,power_law_1.01,1.6258495330810547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,16,balanced,0.035114665826161705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,32,power_law_1.2,0.08503680229187012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,16,balanced,0.04108799993991852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,32,power_law_1.2,0.0958079993724823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,32,power_law_1.01,3.947846221923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,16,balanced,0.04246933261553446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,32,power_law_1.2,0.11911040544509888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,32,balanced,0.5755680004755656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,16,balanced,0.04274666806062063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,32,power_law_1.2,0.14191999435424804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,16,balanced,0.046816001335779824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,32,power_law_1.2,0.15948159694671632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,16,balanced,0.04605866471926371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,32,power_law_1.2,0.21527678966522218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,16,balanced,0.056757330894470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,32,power_law_1.2,0.292140793800354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,16,balanced,0.05250666538874308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,32,power_law_1.2,0.46840319633483884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,16,balanced,0.05277333160241445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,32,power_law_1.2,0.49811840057373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,32,balanced,0.9062773386637369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,16,balanced,0.08371200164159139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,32,power_law_1.2,0.8270208358764648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,16,balanced,0.07426666716734569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,32,power_law_1.2,1.2034432411193847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,16,balanced,0.0738453318675359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,32,power_law_1.2,1.283174419403076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,16,balanced,0.07452799876530965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,32,power_law_1.2,2.5737024307250977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,16,balanced,0.07567999760309856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,16,balanced,0.07666133344173431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,16,power_law_1.01,0.03473280072212219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,32,power_law_1.2,4.982489776611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,16,balanced,0.08231466511885326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,16,power_law_1.01,0.04201599955558777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,16,power_law_1.01,0.03749119937419891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,16,balanced,0.08573333422342937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,16,power_law_1.2,0.03492479920387268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,16,power_law_1.01,0.039724799990653994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,16,balanced,0.09360000491142273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,16,power_law_1.01,0.0412992000579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,16,power_law_1.2,0.04183039963245392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,16,balanced,0.10089600086212158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,16,power_law_1.01,0.0398144006729126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,16,power_law_1.2,0.03699199855327606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,16,power_law_1.01,0.04397439956665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,16,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,16,balanced,0.11815466483434041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,16,power_law_1.01,0.044172799587249754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,32,balanced,1.7804746627807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,16,power_law_1.2,0.042099198698997496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,16,power_law_1.01,0.05702400207519531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,16,balanced,0.1340053379535675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,16,power_law_1.2,0.04177280068397522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,16,power_law_1.01,0.0522816002368927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,16,power_law_1.01,0.055206400156021115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,16,power_law_1.2,0.04408960044384003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,16,balanced,0.21001599232355753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,16,power_law_1.01,0.08330240249633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,16,power_law_1.2,0.045126399397850035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,16,power_law_1.01,0.07687039971351624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,16,power_law_1.2,0.05886719822883606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,16,power_law_1.01,0.08035200238227844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,16,power_law_1.2,0.05500159859657287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,16,balanced,0.242741326491038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,16,power_law_1.01,0.07987200021743775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,16,power_law_1.2,0.05594879984855652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,16,power_law_1.01,0.07731199860572815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,16,power_law_1.01,0.08632959723472595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,16,power_law_1.2,0.08042880296707153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,16,power_law_1.01,0.08854399919509888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,16,power_law_1.2,0.07934079766273498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,16,balanced,0.3496319850285848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,16,power_law_1.01,0.09534720182418824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,16,power_law_1.2,0.08183040022850037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,16,power_law_1.01,0.12191359996795655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,16,power_law_1.01,0.13662079572677613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,16,power_law_1.2,0.07930880188941955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,16,power_law_1.01,0.16531200408935548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,16,power_law_1.2,0.08303999900817871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,16,balanced,0.4535093307495117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,16,power_law_1.01,0.20848000049591064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,16,power_law_1.2,0.08774399757385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,8,balanced,0.029045333464940388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,16,power_law_1.01,0.3061503887176514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,16,power_law_1.2,0.09292799830436707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,8,balanced,0.03160533308982849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,16,power_law_1.01,0.36443519592285156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,16,power_law_1.2,0.09812480211257935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,8,balanced,0.03269333392381668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,16,power_law_1.01,0.48828802108764646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,16,power_law_1.2,0.12776960134506227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,8,balanced,0.03603200117746989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,16,power_law_1.01,0.6893184185028076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,16,power_law_1.2,0.14680960178375244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,16,balanced,0.5616906483968099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,8,balanced,0.03993066648642222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,16,power_law_1.01,0.8571264266967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,16,power_law_1.2,0.19607679843902587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,16,power_law_1.01,1.2557056427001954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,8,balanced,0.04456000030040741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,8,balanced,0.04278933505217234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,16,power_law_1.2,0.21851520538330077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,16,power_law_1.01,2.864531135559082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,8,balanced,0.0428959975639979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,16,power_law_1.2,0.34926719665527345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,8,balanced,0.04689066608746847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,16,power_law_1.2,0.435481595993042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,8,balanced,0.045754666129748024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,16,power_law_1.2,0.5968768119812011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,8,balanced,0.04566933214664459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,8,balanced,0.05644799768924713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,16,power_law_1.2,0.8547455787658691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,16,balanced,0.8826133410135905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,8,balanced,0.054799998799959816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,16,power_law_1.2,1.0200448036193848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,8,balanced,0.0551146666208903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,16,power_law_1.2,1.7004863739013671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,8,balanced,0.08229333162307739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,8,power_law_1.01,0.02993920147418976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,8,balanced,0.0751200020313263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,16,power_law_1.2,4.058560180664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,8,power_law_1.01,0.034272000193595886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,8,balanced,0.07880533238252004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,8,power_law_1.01,0.03294720053672791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,8,balanced,0.08237333099047343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,8,power_law_1.01,0.03527680039405823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,8,balanced,0.08770666519800822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,8,power_law_1.01,0.038540801405906676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,8,balanced,0.09639466802279155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,8,power_law_1.01,0.043628799915313723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,8,balanced,0.10436800122261047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,8,power_law_1.01,0.04167680144309997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,8,power_law_1.01,0.044582399725914004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,8,balanced,0.12313600381215413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,16,balanced,1.731082598368327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,8,power_law_1.01,0.04769279956817627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,8,balanced,0.13980799913406372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,8,power_law_1.01,0.04614399969577789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,8,power_law_1.01,0.04493440091609955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,8,balanced,0.21814932425816855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,8,power_law_1.2,0.0298880010843277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,8,power_law_1.01,0.05738239884376526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,8,power_law_1.2,0.03343360126018524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,8,power_law_1.2,0.031302401423454286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,8,power_law_1.01,0.0531711995601654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,8,balanced,0.25403199593226117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,8,power_law_1.2,0.03575679957866669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,8,power_law_1.01,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,8,power_law_1.2,0.037555199861526486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,8,power_law_1.2,0.04351359903812409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,8,power_law_1.01,0.08262400031089782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,8,power_law_1.2,0.04145280122756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,8,power_law_1.01,0.0818880021572113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,8,balanced,0.36392001310984295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,8,power_law_1.2,0.043910399079322815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,8,power_law_1.01,0.08069120049476623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,8,power_law_1.2,0.04883840084075928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,8,power_law_1.2,0.04538240134716034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,8,power_law_1.01,0.08691200017929077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,8,power_law_1.2,0.04609920084476471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,8,power_law_1.01,0.09171199798583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,8,power_law_1.2,0.05617920160293579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,8,balanced,0.4612319866816203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,8,power_law_1.01,0.1087488055229187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,8,power_law_1.2,0.05467519760131836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,8,power_law_1.01,0.12906240224838256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,8,power_law_1.2,0.056460797786712646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,8,power_law_1.2,0.08595200181007386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,8,power_law_1.01,0.16328320503234864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,8,power_law_1.2,0.08023679852485657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,8,power_law_1.01,0.20171520709991456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,8,power_law_1.2,0.0877120018005371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,4,balanced,0.027248000105222065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,8,power_law_1.01,0.2678656101226807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,8,power_law_1.2,0.09196799993515015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,8,balanced,0.570581316947937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,8,power_law_1.01,0.3378495931625366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,8,power_law_1.2,0.09990400075912476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,4,balanced,0.02917333443959554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,8,power_law_1.2,0.12078720331192017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,4,balanced,0.03091199944416682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,8,power_law_1.01,0.49838719367980955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,8,power_law_1.2,0.14082560539245606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,4,balanced,0.03549333413441976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,8,power_law_1.01,0.586624002456665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,8,power_law_1.2,0.16897280216217042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,4,balanced,0.03999999910593033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,8,power_law_1.2,0.22140800952911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,8,power_law_1.01,0.7366399765014648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,4,balanced,0.048538664976755776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,8,power_law_1.2,0.27261440753936766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,8,power_law_1.01,1.161068820953369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,8,power_law_1.2,0.3788928031921387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,4,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,8,power_law_1.2,0.5685247898101806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,4,power_law_1.01,0.02808319926261902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,8,power_law_1.01,2.300441551208496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,4,balanced,0.04920533299446106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,8,balanced,0.894320011138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,8,power_law_1.2,0.7146495819091797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,4,balanced,0.04880533119042715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,4,power_law_1.01,0.03194240033626557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,8,power_law_1.2,0.8936703681945801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,4,balanced,0.04757333298524221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,8,power_law_1.2,1.3271552085876466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,4,power_law_1.01,0.03134079873561859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,4,balanced,0.049829334020614624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,4,power_law_1.01,0.03421440124511719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,8,power_law_1.2,2.9655616760253904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,4,balanced,0.05282133320967356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,4,power_law_1.01,0.03953920006752014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,4,balanced,0.0532533327738444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,4,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,4,power_law_1.01,0.04601599872112274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,4,balanced,0.05365333457787832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,4,power_law_1.01,0.0457152009010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,4,balanced,0.06252799928188324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,4,power_law_1.01,0.04705280065536499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,4,balanced,0.06328533093134563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,4,power_law_1.01,0.047391998767852786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,4,balanced,0.06596266726652782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,4,power_law_1.01,0.04850560128688812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,4,balanced,0.0979253351688385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,4,power_law_1.01,0.05178239941596985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,8,balanced,1.7489066123962402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,4,balanced,0.10196266571680705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,4,power_law_1.01,0.05191680192947388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,4,power_law_1.01,0.05479679703712463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,4,balanced,0.11069333553314209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,4,power_law_1.01,0.06159359812736511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,4,balanced,0.11893866459528606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,4,power_law_1.01,0.06298239827156067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,4,balanced,0.13894933462142944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,4,power_law_1.01,0.0646016001701355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,4,power_law_1.01,0.10383360385894776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,4,balanced,0.15660267074902853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,4,power_law_1.2,0.02797439992427826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,4,power_law_1.01,0.11622400283813476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,4,power_law_1.01,0.1393280029296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,4,power_law_1.2,0.03144319951534271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,4,balanced,0.24951465924580893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,4,power_law_1.01,0.15326720476150513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,4,power_law_1.2,0.03000960052013397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,4,power_law_1.2,0.034041601419448855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,4,power_law_1.01,0.18372479677200318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,4,balanced,0.2855093280474345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,4,power_law_1.2,0.039212799072265624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,4,power_law_1.01,0.22200961112976075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,4,power_law_1.01,0.3092927932739258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,4,power_law_1.2,0.04312959909439087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,2,balanced,0.02701866626739502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,4,power_law_1.2,0.0461760014295578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,4,balanced,0.4117973248163859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,4,power_law_1.01,0.3766335964202881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,2,balanced,0.028837333122889202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,4,power_law_1.2,0.04677119851112366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,4,power_law_1.01,0.5346560001373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,2,balanced,0.029546665648619335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,4,power_law_1.2,0.04682239890098572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,2,balanced,0.03489066660404205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,4,power_law_1.01,0.6643392086029053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,2,balanced,0.041450666884581246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,4,power_law_1.2,0.04663040041923523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,4,power_law_1.01,0.8033599853515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,4,balanced,0.5369280179341634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,4,power_law_1.2,0.048281601071357726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,4,power_law_1.01,1.2229248046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,2,balanced,0.05264000097910563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,4,power_law_1.2,0.05186560153961182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,2,balanced,0.054005334774653115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,4,power_law_1.01,2.437766456604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,4,power_law_1.2,0.052121597528457644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,2,balanced,0.05299200117588043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,4,power_law_1.2,0.05824000239372253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,4,balanced,0.6651626825332642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,4,power_law_1.2,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,2,balanced,0.05349866549173991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,2,balanced,0.0521919975678126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,4,power_law_1.2,0.0695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,2,balanced,0.053685332338015236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,4,power_law_1.2,0.07594879865646362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,2,balanced,0.05276266733805338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,4,power_law_1.2,0.09796479940414429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,2,power_law_1.01,0.026969599723815917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,2,balanced,0.05339199801286062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,4,power_law_1.2,0.1299008011817932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,2,balanced,0.05418666700522105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,2,power_law_1.01,0.028870400786399842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,4,balanced,1.0409493446350098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,4,power_law_1.2,0.14434560537338256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,2,balanced,0.05931733548641205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,2,power_law_1.01,0.02839680016040802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,2,balanced,0.060559997955958046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,4,power_law_1.2,0.15781760215759277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,2,power_law_1.01,0.033504000306129454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,2,balanced,0.0631520003080368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,2,power_law_1.01,0.03730559945106506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,4,power_law_1.2,0.18867839574813844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,2,balanced,0.07778133451938629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,4,power_law_1.2,0.22848000526428222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,2,power_law_1.01,0.04373759925365448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,2,balanced,0.08257600168387096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,4,power_law_1.2,0.32334079742431643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,2,power_law_1.01,0.04759680032730103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,2,balanced,0.1277653376261393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,4,power_law_1.2,0.4039487838745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,2,power_law_1.01,0.051123201847076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,4,power_law_1.2,0.5634431838989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,2,balanced,0.13709867000579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,2,power_law_1.01,0.05006080269813538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,4,power_law_1.2,0.6795904159545898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,2,balanced,0.15899200240770975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,2,power_law_1.01,0.048851200938224794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,4,power_law_1.2,0.9103487968444824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,2,power_law_1.01,0.05067520141601563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,2,balanced,0.18006932735443115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,4,power_law_1.2,1.3613439559936524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,2,power_law_1.01,0.05077120065689087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,4,balanced,2.0385920206705728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,2,balanced,0.2918826738993327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,4,power_law_1.2,2.696358489990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,2,power_law_1.01,0.05196160078048706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,2,power_law_1.01,0.057920002937316896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,2,balanced,0.3330346743265788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,2,power_law_1.01,0.05768960118293762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,2,power_law_1.01,0.06101760268211365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,2,power_law_1.2,0.026848000288009644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,2,power_law_1.01,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,2,balanced,0.4813493490219116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,2,power_law_1.2,0.028121599555015565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,2,power_law_1.01,0.08707839846611024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,2,power_law_1.2,0.028428798913955687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,2,power_law_1.2,0.03301759958267212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,32,balanced,0.041002665956815086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,2,power_law_1.01,0.09427840113639832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,2,power_law_1.2,0.03560320138931274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,2,power_law_1.2,0.04046719968318939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,2,power_law_1.01,0.15457919836044312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,2,balanced,0.6288959980010986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,2,power_law_1.2,0.046239998936653134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,32,balanced,0.04243200023969015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,2,power_law_1.01,0.17011200189590453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,2,power_law_1.2,0.0487744003534317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,2,power_law_1.2,0.04952319860458374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,2,power_law_1.01,0.20840320587158204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,2,power_law_1.2,0.04904319941997528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,32,balanced,0.042266666889190674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,2,power_law_1.2,0.050297600030899045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,2,power_law_1.01,0.2458944082260132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,2,power_law_1.2,0.050911998748779295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,2,balanced,0.7774026393890381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,2,power_law_1.2,0.05548800230026245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,2,power_law_1.01,0.3343744039535522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,2,power_law_1.2,0.05912960171699524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,2,power_law_1.01,0.40840959548950195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,2,power_law_1.2,0.05940480232238769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,32,balanced,0.04710933566093445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,2,power_law_1.01,0.5626751899719238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,2,power_law_1.2,0.06702079772949218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,2,power_law_1.2,0.07061759829521179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,32,power_law_1.01,0.04094719886779785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,2,power_law_1.01,0.7264256000518798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,2,power_law_1.2,0.08803200125694274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,2,power_law_1.2,0.0945792019367218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,2,power_law_1.01,0.8834112167358399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,32,power_law_1.01,0.041580799221992495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,2,power_law_1.2,0.16033920049667358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,32,balanced,0.05097066859404246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,2,balanced,1.2144320011138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,32,power_law_1.01,0.040992000699043275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,2,power_law_1.01,1.377791976928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,2,power_law_1.2,0.18083200454711915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,2,power_law_1.2,0.20945279598236083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,32,power_law_1.01,0.04487679898738861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,2,power_law_1.01,2.5582143783569338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,2,power_law_1.2,0.2550015926361084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,32,power_law_1.01,0.048640000820159915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,2,power_law_1.2,0.3438976049423218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,2,power_law_1.2,0.4385791778564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,2,power_law_1.2,0.6132544040679931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,2,power_law_1.2,0.7150144100189209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,32,balanced,0.05683733522891998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,2,power_law_1.2,0.8890687942504882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,2,power_law_1.2,1.408518409729004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,32,power_law_1.01,0.05502079725265503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,2,power_law_1.2,2.8429824829101564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,32,balanced,0.056218668818473816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,32,balanced,0.0565280020236969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,2,balanced,2.3784693082173667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,32,balanced,0.06617600222428639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,32,power_law_1.01,0.05602560043334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,32,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,32,balanced,0.06576000154018402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,32,power_law_1.01,0.06568959951400757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,32,balanced,0.06649066507816315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,32,power_law_1.01,0.06558079719543457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,32,balanced,0.06592533489068349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,32,power_law_1.01,0.06583679914474487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,32,balanced,0.0672106643517812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,32,power_law_1.01,0.06563839912414551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,32,balanced,0.06788266698519389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,32,power_law_1.2,0.04137600064277649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,32,power_law_1.01,0.06689280271530151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,32,balanced,0.0683840016523997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,32,power_law_1.01,0.06813439726829529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,32,power_law_1.2,0.04221439957618713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,32,balanced,0.06836799780527751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,32,power_law_1.2,0.04172160029411316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,32,power_law_1.01,0.06959360241889953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,32,balanced,0.07041066884994507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,32,power_law_1.2,0.0457152009010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,32,power_law_1.01,0.06908800005912781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,32,balanced,0.07267199953397115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,32,power_law_1.2,0.04891520142555237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,32,power_law_1.01,0.07109119892120361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,32,balanced,0.07558933397134145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,32,power_law_1.2,0.05500159859657287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,32,power_law_1.01,0.08412160277366638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,32,power_law_1.01,0.10559999942779541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,32,power_law_1.2,0.056377601623535153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,32,balanced,0.08385066191355388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,32,power_law_1.01,0.14039039611816406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,32,power_law_1.2,0.05655679702758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,32,balanced,0.09241599837938945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,32,power_law_1.01,0.18426239490509033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,32,power_law_1.2,0.06611199975013733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,32,power_law_1.01,0.2353663921356201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,32,balanced,0.10909333825111389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,32,power_law_1.2,0.06606079936027527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,32,power_law_1.01,0.3214848041534424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,32,power_law_1.2,0.06688640117645264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,32,balanced,0.12948266665140787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,32,power_law_1.01,0.47491841316223143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,32,power_law_1.2,0.06680960059165955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,32,balanced,0.19382933775583902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,32,power_law_1.2,0.06752640008926392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,32,power_law_1.01,0.5972671985626221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,32,power_law_1.2,0.0685696005821228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,32,power_law_1.01,0.9684224128723145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,32,power_law_1.2,0.06907520294189454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,32,balanced,0.2395253380139669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,32,power_law_1.01,1.1361599922180177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,32,power_law_1.2,0.0701632022857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,32,power_law_1.01,1.5997695922851562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,32,power_law_1.2,0.07211520075798035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,32,power_law_1.01,2.6553152084350584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,32,power_law_1.2,0.1109120011329651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,32,balanced,0.34827733039855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,32,power_law_1.2,0.12359039783477783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,32,power_law_1.01,5.290425491333008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,16,balanced,0.03129599988460541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,16,power_law_1.01,0.031052801012992858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,32,power_law_1.2,0.16815359592437745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,16,balanced,0.03225066761175791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,32,power_law_1.2,0.18689919710159303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,16,power_law_1.01,0.0318336009979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,32,balanced,0.45163198312123615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,32,power_law_1.2,0.27294719219207764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,16,balanced,0.03233599911133448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,32,power_law_1.2,0.3548799991607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,16,power_law_1.01,0.0320576012134552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,16,balanced,0.03700799991687139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,32,power_law_1.2,0.524128007888794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,16,power_law_1.01,0.035718399286270144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,32,power_law_1.2,0.6903744220733643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,32,balanced,0.5592693487803141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,32,power_law_1.2,1.0203007698059081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,16,balanced,0.03899200012286504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,32,power_law_1.2,1.347059154510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,16,power_law_1.01,0.03840000033378601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,32,power_law_1.2,1.6786624908447265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,32,power_law_1.2,2.669113540649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,16,balanced,0.041706666350364685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,32,power_law_1.2,5.315244674682617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,16,power_law_1.01,0.04110080003738403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,32,balanced,0.8826879660288492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,16,balanced,0.05003733436266581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,16,balanced,0.04946133494377136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,16,power_law_1.01,0.04906879961490631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,16,power_law_1.01,0.04824320077896118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,16,balanced,0.048938666780789696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,16,balanced,0.04951466619968414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,16,power_law_1.01,0.04867840111255646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,16,balanced,0.05176533261934916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,16,power_law_1.01,0.049081599712371825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,16,balanced,0.05141866703828176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,16,power_law_1.01,0.05095679759979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,16,balanced,0.058789332707722984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,16,power_law_1.01,0.05127679705619812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,16,balanced,0.05860800047715505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,16,power_law_1.01,0.05807999968528747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,16,balanced,0.0587360014518102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,8,balanced,0.027914665639400482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,32,balanced,1.741477330525716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,16,power_law_1.2,0.03116160035133362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,16,power_law_1.01,0.058361601829528806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,16,balanced,0.05949866771697998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,8,balanced,0.02906133234500885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,16,power_law_1.2,0.032313600182533264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,16,power_law_1.01,0.059520000219345094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,16,balanced,0.061119998494784035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,8,balanced,0.029792000850041706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,16,power_law_1.2,0.03204480111598969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,16,power_law_1.01,0.059628802537918094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,16,balanced,0.06346133351325989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,8,balanced,0.03439466655254364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,16,power_law_1.2,0.03529599905014038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,16,power_law_1.01,0.06496000289916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,16,balanced,0.06632000207901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,16,power_law_1.2,0.03829120099544525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,16,power_law_1.01,0.07793920040130616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,8,power_law_1.01,0.028537601232528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,8,balanced,0.035445332527160645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,16,balanced,0.07537066439787547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,16,power_law_1.2,0.04175359904766083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,16,power_law_1.01,0.08106880187988282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,8,power_law_1.01,0.02885119915008545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,16,balanced,0.0851146678129832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,16,power_law_1.2,0.048416000604629514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,16,power_law_1.01,0.13058559894561766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,8,power_law_1.01,0.028908801078796387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,8,balanced,0.03709866603215536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,16,power_law_1.2,0.049004799127578734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,16,balanced,0.11204266548156738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,8,power_law_1.01,0.033107200264930726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,16,power_law_1.01,0.13521920442581176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,16,power_law_1.2,0.050406402349472045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,8,power_law_1.01,0.03505919873714447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,16,power_law_1.01,0.1686079978942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,8,balanced,0.040421334405740104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,16,power_law_1.2,0.04963200092315674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,16,balanced,0.12839466333389282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,8,power_law_1.01,0.037254399061203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,16,power_law_1.01,0.2545792102813721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,16,power_law_1.2,0.052160000801086424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,8,balanced,0.040336000422636666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,8,power_law_1.01,0.040780800580978396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,16,power_law_1.01,0.35333120822906494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,16,power_law_1.2,0.0520576000213623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,16,balanced,0.19511467218399048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,8,power_law_1.01,0.040524798631668094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,16,power_law_1.01,0.4917503833770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,16,power_law_1.2,0.058246397972106935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,16,power_law_1.01,0.6632768154144287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,16,power_law_1.2,0.05921919941902161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,8,balanced,0.04457066456476847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,16,power_law_1.01,0.9246015548706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,16,balanced,0.23522667090098062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,16,power_law_1.2,0.05932160019874573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,16,power_law_1.2,0.05980799794197082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,16,power_law_1.01,1.1962112426757812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,8,balanced,0.04418133199214935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,8,power_law_1.01,0.04456959962844849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,16,power_law_1.2,0.06664320230484008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,8,balanced,0.04484266539414724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,16,power_law_1.01,2.2787519454956056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,8,power_law_1.01,0.04506239891052246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,16,balanced,0.33938666184743244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,16,power_law_1.2,0.07603840231895446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,16,power_law_1.01,3.8335617065429686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,8,power_law_1.01,0.0451200008392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,16,power_law_1.2,0.08246399760246277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,16,power_law_1.2,0.12424319982528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,8,balanced,0.0448586642742157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,16,power_law_1.2,0.15942399501800536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,16,balanced,0.4426079988479614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,8,balanced,0.04580266773700714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,16,power_law_1.2,0.21729280948638915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,8,power_law_1.01,0.0460671991109848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,8,balanced,0.04791999856630961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,16,power_law_1.2,0.31960320472717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,8,power_law_1.01,0.046086400747299194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,8,balanced,0.048570667703946434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,16,power_law_1.2,0.5101823806762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,8,power_law_1.01,0.04958080053329468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,8,balanced,0.05576533575852712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,16,power_law_1.2,0.5548927783966064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,8,power_law_1.01,0.052876800298690796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,16,balanced,0.549402674039205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,8,balanced,0.057087997595469155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,16,power_law_1.2,1.0076800346374513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,8,power_law_1.01,0.058316802978515624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,8,balanced,0.059418668349583946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,16,power_law_1.2,1.2658304214477538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,8,power_law_1.01,0.06469119787216186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,8,balanced,0.06250666578610738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,16,power_law_1.2,1.5744064331054688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,8,power_law_1.01,0.07063040137290955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,8,balanced,0.07884266475836436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,8,power_law_1.01,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,16,power_law_1.2,2.5855104446411135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,8,power_law_1.2,0.02879360020160675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,8,power_law_1.01,0.092467200756073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,8,balanced,0.0890933374563853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,16,power_law_1.2,5.168544006347656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,8,power_law_1.01,0.10436480045318604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,8,power_law_1.2,0.0289792001247406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,16,balanced,0.8629493713378906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,8,balanced,0.1123413344224294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,8,power_law_1.01,0.15633920431137086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,8,power_law_1.2,0.028947201371192933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,8,power_law_1.01,0.2143872022628784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,8,power_law_1.2,0.03310079872608185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,8,balanced,0.1332266628742218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,8,power_law_1.2,0.03495680093765259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,8,power_law_1.01,0.3334399938583374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,8,power_law_1.2,0.037036800384521486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,8,balanced,0.20143999656041464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,8,power_law_1.01,0.3773695945739746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,8,power_law_1.2,0.04059520065784454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,8,power_law_1.01,0.5557568073272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,8,power_law_1.2,0.0401856005191803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,8,balanced,0.24355733394622803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,8,power_law_1.01,0.7857215881347657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,8,power_law_1.2,0.04467200040817261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,8,power_law_1.01,1.0943743705749511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,8,power_law_1.2,0.04542720019817352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,8,power_law_1.01,1.3178239822387696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,8,power_law_1.2,0.046751999855041505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,8,balanced,0.35228268305460614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,8,power_law_1.2,0.0459199994802475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,4,balanced,0.02619733413060506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,8,power_law_1.01,3.1440704345703123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,4,balanced,0.028207999964555103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,8,power_law_1.2,0.04604800045490265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,16,balanced,1.6965333620707195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,4,balanced,0.029893333713213604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,4,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,8,power_law_1.2,0.05177599787712097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,8,balanced,0.4492533206939697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,4,balanced,0.033786666889985405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,8,power_law_1.2,0.05381760001182556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,4,balanced,0.033071999748547874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,8,power_law_1.2,0.061977601051330565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,8,power_law_1.2,0.06421759724617004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,4,balanced,0.03605333218971888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,8,power_law_1.2,0.07226240038871765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,8,balanced,0.5546293258666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,8,power_law_1.2,0.0794048011302948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,4,balanced,0.034373333056767784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,8,power_law_1.2,0.09653760194778442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,8,power_law_1.2,0.13345279693603515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,8,power_law_1.2,0.16951040029525757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,4,balanced,0.03867733230193456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,4,balanced,0.038959999879201256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,8,power_law_1.2,0.2516223907470703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,4,balanced,0.037818667789300285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,8,power_law_1.2,0.34031360149383544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,8,balanced,0.870533307393392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,8,power_law_1.2,0.4380352020263672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,4,power_law_1.01,0.02654080092906952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,8,power_law_1.2,0.7254848003387451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,4,balanced,0.05152533451716105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,4,power_law_1.01,0.028332799673080444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,8,power_law_1.2,0.9641280174255371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,4,balanced,0.05330666899681091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,4,balanced,0.0479360024134318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,4,power_law_1.01,0.029318401217460634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,8,power_law_1.2,1.12489595413208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,4,balanced,0.049813335140546165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,4,power_law_1.01,0.031814399361610415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,4,balanced,0.053717335065205894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,8,power_law_1.2,1.618623924255371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,4,power_law_1.01,0.03301759958267212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,4,balanced,0.05529066423575083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,4,balanced,0.06457599997520447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,4,power_law_1.01,0.03288320004940033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,8,power_law_1.2,4.512128067016602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,4,balanced,0.06860800087451935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,4,power_law_1.01,0.03560959994792938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,4,balanced,0.08768000205357869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,4,power_law_1.01,0.033881598711013795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,4,balanced,0.09709866841634114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,4,power_law_1.01,0.0392192006111145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,4,balanced,0.1239466667175293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,4,power_law_1.01,0.0387584000825882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,8,balanced,1.711077372233073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,4,balanced,0.14881599942843118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,4,power_law_1.01,0.03840000033378601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,4,power_law_1.01,0.05236480236053467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,4,balanced,0.22419732809066772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,4,power_law_1.01,0.05418239831924439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,4,power_law_1.01,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,4,balanced,0.27677865823109943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,4,power_law_1.01,0.0521664023399353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,4,power_law_1.01,0.056531202793121335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,4,balanced,0.40057067076365155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,4,power_law_1.01,0.060147202014923094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,4,power_law_1.2,0.02650879919528961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,4,power_law_1.01,0.07325440049171447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,4,power_law_1.2,0.028774398565292358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,4,power_law_1.01,0.08373759984970093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,4,balanced,0.5257759888966879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,4,power_law_1.2,0.029440000653266907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,4,power_law_1.01,0.09746559858322143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,4,power_law_1.2,0.03182719945907593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,4,power_law_1.01,0.11963520050048829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,4,power_law_1.2,0.03294720053672791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,4,power_law_1.2,0.03239679932594299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,4,power_law_1.01,0.17178879976272582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,4,power_law_1.2,0.035795199871063235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,4,power_law_1.01,0.19769599437713622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,4,balanced,0.6502933502197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,4,power_law_1.01,0.3089792013168335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,4,power_law_1.2,0.03444480001926422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,4,power_law_1.01,0.3900288105010986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,4,power_law_1.2,0.03930239975452423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,4,power_law_1.2,0.039801600575447085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,4,power_law_1.01,0.4917888164520264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,4,power_law_1.2,0.039417600631713866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,4,power_law_1.01,0.7410240173339844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,4,power_law_1.2,0.05312640070915222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,4,power_law_1.01,0.8467007637023926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,4,balanced,1.0241813659667969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,4,power_law_1.2,0.054425597190856934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,4,power_law_1.01,1.532857608795166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,2,balanced,0.02571200082699458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,4,power_law_1.2,0.05788159966468811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,4,power_law_1.01,3.087980842590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,4,power_law_1.2,0.05655679702758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,2,balanced,0.02743999908367793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,2,balanced,0.027978666126728058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,4,power_law_1.2,0.05726720094680786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,2,balanced,0.03339733431736628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,4,power_law_1.2,0.06106240153312683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,2,balanced,0.03356799980004629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,4,power_law_1.2,0.07676159739494323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,2,balanced,0.03403199960788091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,4,power_law_1.2,0.08140159845352173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,2,balanced,0.034602666894594826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,4,power_law_1.2,0.09800320267677307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,2,balanced,0.03374933451414108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,4,power_law_1.2,0.14050559997558593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,4,power_law_1.2,0.17848960161209107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,2,balanced,0.03611200054486593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,4,power_law_1.2,0.2458240032196045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,4,balanced,2.006453355153402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,2,balanced,0.036133334040641785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,4,power_law_1.2,0.3550463914871216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,4,power_law_1.2,0.454860782623291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,4,power_law_1.2,0.604531192779541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,2,balanced,0.035242666800816856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,2,power_law_1.01,0.025887998938560485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,4,power_law_1.2,0.7767551898956299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,2,power_law_1.2,0.02558720111846924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,2,power_law_1.01,0.02705279886722565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,4,power_law_1.2,1.0886079788208007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,2,power_law_1.01,0.027110400795936584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,2,power_law_1.2,0.026924800872802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,2,balanced,0.04134399940570196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,4,power_law_1.2,1.6684415817260743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,2,power_law_1.2,0.027001601457595826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,2,power_law_1.01,0.030873599648475646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,2,balanced,0.0423573354880015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,2,power_law_1.2,0.030483201146125793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,2,power_law_1.01,0.03261440098285675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,4,power_law_1.2,3.503206253051758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,2,power_law_1.2,0.03270399868488312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,2,power_law_1.01,0.03369599878787995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,2,balanced,0.04058133314053217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,2,power_law_1.2,0.03346560001373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,2,power_law_1.01,0.034220799803733826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,2,power_law_1.2,0.03392640054225922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,2,power_law_1.01,0.03456639945507049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,2,power_law_1.2,0.03475199937820435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,2,power_law_1.01,0.037625598907470706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,2,balanced,0.055359999338785805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,2,power_law_1.2,0.03813759982585907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,2,power_law_1.01,0.03758080005645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,2,balanced,0.057029331723848976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,2,power_law_1.2,0.037862399220466615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,2,power_law_1.01,0.03899520039558411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,2,power_law_1.2,0.03871999979019165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,2,power_law_1.01,0.04206719994544983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,2,power_law_1.2,0.04207360148429871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,2,power_law_1.01,0.0430976003408432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,2,power_law_1.2,0.0423552006483078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,2,balanced,0.05492799977461497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,2,power_law_1.01,0.04415999948978424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,2,power_law_1.2,0.044300800561904906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,8,balanced,0.03138133386770884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,2,balanced,0.06402133405208588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,2,power_law_1.01,0.060755199193954466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,2,power_law_1.2,0.060703998804092406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,8,balanced,0.031445334355036415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,2,balanced,0.07111466427644093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,2,power_law_1.01,0.06240000128746033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,2,power_law_1.2,0.063264000415802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,8,balanced,0.031328000128269196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,2,power_law_1.01,0.06614400148391723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,2,balanced,0.09633066256841023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,2,power_law_1.2,0.06684160232543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,8,balanced,0.032261334359645844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,8,balanced,0.0340693344672521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,2,power_law_1.01,0.07599999904632568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,2,power_law_1.2,0.07701119780540466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,8,balanced,0.03219199925661087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,2,balanced,0.10630933443705241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,8,balanced,0.03369066615899404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,2,power_law_1.01,0.08266879916191101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,2,power_law_1.2,0.084934401512146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,8,balanced,0.033029332756996155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,8,balanced,0.0344106654326121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,2,balanced,0.1381493310133616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,2,power_law_1.01,0.10444799661636353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,8,balanced,0.03346133232116699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,2,power_law_1.2,0.10438400506973267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,8,balanced,0.03773866593837738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,8,balanced,0.03631466627120972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,2,power_law_1.01,0.11848959922790528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,2,power_law_1.2,0.11914240121841431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,2,balanced,0.17080533504486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,8,balanced,0.03786666691303253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,8,balanced,0.03695466617743174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,2,power_law_1.01,0.16895999908447265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,2,power_law_1.2,0.17943040132522584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,8,balanced,0.03828266759713491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,8,balanced,0.03648533423741659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,2,power_law_1.01,0.22929279804229735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,2,power_law_1.2,0.23462400436401368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,2,balanced,0.25702933470408124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,8,balanced,0.03796799977620443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,8,balanced,0.036992001036802925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,2,power_law_1.2,0.3308799982070923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,2,power_law_1.01,0.3068351984024048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,8,balanced,0.038373333712418876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,8,balanced,0.0367253323396047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,2,power_law_1.2,0.4351168155670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,2,power_law_1.01,0.4101888179779053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,2,balanced,0.3216106692949931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,8,balanced,0.03873066604137421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,8,balanced,0.03738133360942205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,2,power_law_1.2,0.573964786529541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,2,power_law_1.01,0.558835220336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,8,balanced,0.038975998759269714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,8,balanced,0.03739733248949051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,2,power_law_1.2,0.8734848022460937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,2,power_law_1.01,0.7872960090637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,8,balanced,0.04206933577855428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,8,balanced,0.03866666555404663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,8,balanced,0.0436160018046697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,2,balanced,0.46836801369984943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,2,power_law_1.2,0.9054911613464356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,2,power_law_1.01,0.8886336326599121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,8,balanced,0.03844800094763438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,8,balanced,0.043391997615496315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,2,power_law_1.2,1.6408447265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,2,power_law_1.01,1.5229439735412598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,8,balanced,0.03849600007136663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,8,balanced,0.04785599807898203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,8,balanced,0.03752533346414566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,8,balanced,0.046367997924486794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,2,power_law_1.01,2.7166976928710938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,2,power_law_1.2,3.1044864654541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,8,balanced,0.040991999208927155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,8,balanced,0.06571733454863231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,2,balanced,0.6144533157348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,8,balanced,0.04083733260631561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,8,balanced,0.05829333265622457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,8,balanced,0.042394667863845825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,8,balanced,0.08122666676839192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,8,balanced,0.05095999936262766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,8,balanced,0.04822933177153269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,2,balanced,0.7616373697916666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,8,balanced,0.07911466558774312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,8,balanced,0.06776000062624614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,8,balanced,0.12139733632405598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,8,balanced,0.07130666573842366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,8,balanced,0.09609066446622212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,8,balanced,0.1290720005830129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,8,balanced,0.10713066657384236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,8,balanced,0.025519999365011852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,8,balanced,0.1984000007311503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,2,balanced,1.191701332728068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,8,balanced,0.15126400192578635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,8,balanced,0.025557334224383037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,8,balanced,0.02550400048494339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,8,balanced,0.17547200123469034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,8,balanced,0.2301386594772339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,8,balanced,0.027471999327341717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,8,balanced,0.027717334528764088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,8,balanced,0.0281333327293396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,8,balanced,0.25517332553863525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,8,balanced,0.028202667832374573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,8,balanced,0.29820799827575684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,8,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,8,balanced,0.31496532758076984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,8,balanced,0.02829333394765854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,8,balanced,0.028783999383449554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,8,power_law_1.01,0.030611199140548707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,8,balanced,0.42713598410288495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,8,balanced,0.3927253484725952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,8,power_law_1.01,0.03086079955101013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,8,power_law_1.01,0.03052160143852234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,8,balanced,0.02828266719977061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,8,power_law_1.01,0.03218559920787811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,8,balanced,0.02923733244339625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,8,power_law_1.01,0.03196159899234772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,2,balanced,2.341493288675944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,8,power_law_1.01,0.04030719995498657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,8,balanced,0.5890453259150187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,8,balanced,0.029951999584833782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,8,power_law_1.01,0.03366400003433227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,8,power_law_1.01,0.042777600884437564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,8,balanced,0.028522667785485584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,8,power_law_1.01,0.03798399865627289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,8,power_law_1.01,0.03365119993686676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,8,balanced,0.7619040012359619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,8,power_law_1.01,0.040166398882865904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,8,power_law_1.01,0.03621760010719299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,8,power_law_1.01,0.035750401020050046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,8,power_law_1.01,0.03925760090351105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,8,power_law_1.01,0.036320000886917114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,8,power_law_1.01,0.03473919928073883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,8,power_law_1.01,0.04078719913959503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,8,balanced,0.03514666606982549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,8,power_law_1.01,0.03578239977359772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,8,power_law_1.01,0.04708479940891266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,8,power_law_1.01,0.0367935985326767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,8,balanced,0.03527999917666117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,8,power_law_1.01,0.03784320056438446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,8,balanced,1.1219200293223064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,8,power_law_1.01,0.047417598962783816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,8,power_law_1.01,0.03933440148830414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,8,balanced,0.035258665680885315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,8,power_law_1.01,0.048614400625228885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,8,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,8,power_law_1.01,0.04058879911899567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,8,power_law_1.01,0.06335999965667724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,8,power_law_1.01,0.0406464010477066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,8,power_law_1.01,0.052857601642608644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,8,power_law_1.01,0.07129600048065185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,8,power_law_1.01,0.053523200750350955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,8,power_law_1.01,0.0674239993095398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,8,power_law_1.01,0.05726079940795899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,8,balanced,0.041322665909926094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,8,power_law_1.01,0.0839680016040802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,8,power_law_1.01,0.08079360127449035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,8,balanced,0.04269866645336151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,8,power_law_1.01,0.08948479890823365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,8,power_law_1.01,0.08117120265960694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,8,power_law_1.01,0.12621439695358277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,8,power_law_1.01,0.10257920026779174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,8,power_law_1.01,0.11257599592208863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,8,power_law_1.01,0.1345728039741516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,8,power_law_1.01,0.15520000457763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,8,power_law_1.01,0.18410880565643312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,8,power_law_1.01,0.1817471981048584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,8,power_law_1.01,0.24113919734954833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,8,power_law_1.01,0.21683840751647948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,8,power_law_1.01,0.33943679332733157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,8,power_law_1.01,0.3035007953643799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,8,balanced,0.05110399921735128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,8,power_law_1.01,0.5021056175231934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,8,power_law_1.01,0.601804780960083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,8,power_law_1.01,0.3418175935745239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,8,power_law_1.01,0.8306559562683106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,8,power_law_1.01,0.49245438575744627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,8,power_law_1.01,1.2569024085998535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,8,power_law_1.01,0.6695424079895019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,8,power_law_1.01,2.3946943283081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,8,power_law_1.01,0.7648640155792237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,8,power_law_1.01,1.4721664428710937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,8,balanced,0.060640002290407814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,8,power_law_1.01,2.452838325500488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,8,balanced,0.0780320018529892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,8,power_law_1.2,0.030847999453544616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,8,power_law_1.2,0.03091199994087219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,8,balanced,0.09248000383377075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,8,power_law_1.2,0.03073279857635498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,8,power_law_1.2,0.03185279965400696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,8,balanced,0.12990933656692505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,8,power_law_1.01,0.024908800423145295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,8,power_law_1.2,0.03234559893608093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,8,balanced,0.1600266695022583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,8,power_law_1.01,0.024742400646209715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,8,power_law_1.2,0.04237439930438995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,8,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,8,power_law_1.2,0.04301440119743347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,8,power_law_1.01,0.026707199215888978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,8,balanced,0.23669334252675375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,8,power_law_1.2,0.03804160058498383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,8,power_law_1.01,0.026956799626350402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,8,power_law_1.2,0.03956480026245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,8,power_law_1.01,0.027481600642204285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,8,power_law_1.2,0.03991680145263672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,8,balanced,0.321834663550059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,8,power_law_1.01,0.0281792014837265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,8,power_law_1.2,0.041119998693466185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,8,power_law_1.01,0.02874239981174469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,8,power_law_1.2,0.0463808000087738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,8,power_law_1.01,0.030451199412345885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,8,power_law_1.01,0.031148800253868104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,8,balanced,0.3964960177739461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,8,power_law_1.2,0.054022401571273804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,8,power_law_1.2,0.05356799960136414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,8,power_law_1.2,0.06527360081672669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,8,power_law_1.01,0.036748799681663516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,8,power_law_1.2,0.06956160068511963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,8,power_law_1.01,0.04258559942245484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,8,power_law_1.2,0.06481919884681701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,8,balanced,0.6057493289311727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,8,power_law_1.01,0.04059520065784454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,8,power_law_1.2,0.08167679905891419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,8,power_law_1.01,0.050425601005554196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,8,power_law_1.2,0.09436799883842469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,8,power_law_1.2,0.13374719619750977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,8,power_law_1.2,0.13178880214691163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,8,power_law_1.01,0.05183359980583191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,8,power_law_1.2,0.1717311978340149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,8,power_law_1.01,0.057036799192428586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,8,power_law_1.2,0.19701759815216063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,8,power_law_1.01,0.06817920207977295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,8,balanced,1.1962453524271648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,8,power_law_1.2,0.3129472017288208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,8,power_law_1.2,0.3665472030639648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,8,power_law_1.2,0.49298558235168455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,8,power_law_1.2,0.03335680067539215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,8,power_law_1.01,0.07623040080070495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,8,power_law_1.2,0.6728320121765137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,8,power_law_1.01,0.08888319730758668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,8,power_law_1.2,0.0336896002292633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,8,power_law_1.2,0.8254336357116699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,8,power_law_1.2,0.033529600501060484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,8,power_law_1.2,1.4575167655944825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,8,power_law_1.2,0.035769599676132205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,8,power_law_1.01,0.11359360218048095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,8,power_law_1.2,0.03575679957866669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,8,power_law_1.2,2.520377540588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,8,power_law_1.2,0.03621760010719299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,8,power_law_1.2,0.024902400374412537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,4,balanced,0.03266133368015289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,8,power_law_1.2,0.035980799794197084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,8,power_law_1.01,0.14128639698028564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,8,power_law_1.2,0.024908800423145295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,4,balanced,0.029466666281223297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,8,power_law_1.2,0.03592959940433502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,8,power_law_1.01,0.2082751989364624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,4,balanced,0.029717333614826202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,8,power_law_1.2,0.036575999855995175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,8,power_law_1.2,0.024915200471878052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,4,balanced,0.030778666337331135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,8,power_law_1.2,0.03683840036392212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,8,power_law_1.2,0.026598399877548216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,8,power_law_1.01,0.222707200050354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,4,balanced,0.03068800022204717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,8,power_law_1.2,0.03929600119590759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,8,power_law_1.2,0.027020800113677978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,8,power_law_1.01,0.4075007915496826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,4,balanced,0.031386665999889374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,8,power_law_1.2,0.04115839898586273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,8,power_law_1.2,0.027590399980545043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,8,power_law_1.01,0.4742784023284912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,4,balanced,0.032816000282764435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,8,power_law_1.2,0.04038400053977966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,8,power_law_1.2,0.02800000011920929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,8,power_law_1.01,0.7997375965118408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,4,balanced,0.0367253323396047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,8,power_law_1.2,0.04215039908885956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,8,power_law_1.2,0.02865920066833496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,4,balanced,0.036746665835380554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,8,power_law_1.01,1.0608192443847657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,8,power_law_1.2,0.04830079972743988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,4,balanced,0.03707200040419897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,8,power_law_1.2,0.029862400889396668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,8,power_law_1.01,1.244211196899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,8,power_law_1.2,0.05546879768371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,4,balanced,0.03745066622893015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,8,power_law_1.2,0.030348798632621764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,8,power_law_1.01,2.028544044494629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,4,balanced,0.03812800099452337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,8,power_law_1.2,0.06060799956321716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,4,balanced,0.0383840004603068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,8,power_law_1.2,0.0837440013885498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,8,power_law_1.01,4.009286499023437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,8,power_law_1.2,0.036236798763275145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,4,balanced,0.03920000046491623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,4,balanced,0.03200533241033554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,8,power_law_1.2,0.08236799836158752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,8,power_law_1.2,0.041305598616600034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,4,balanced,0.04261333247025808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,4,balanced,0.03179733455181122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,8,power_law_1.2,0.11091840267181396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,4,balanced,0.044351999958356224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,8,power_law_1.2,0.0429504007101059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,4,balanced,0.03629333277543386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,8,power_law_1.2,0.11182719469070435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,4,balanced,0.03435733417669932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,4,balanced,0.04739200075467428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,8,power_law_1.2,0.05242239832878113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,4,balanced,0.03590933233499527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,8,power_law_1.2,0.1605631947517395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,4,balanced,0.03472000112136205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,4,balanced,0.05865600208441416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,4,balanced,0.035274667044480644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,8,power_law_1.2,0.17990399599075318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,4,balanced,0.05154666801293691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,4,balanced,0.034874667723973594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,8,power_law_1.2,0.2641792058944702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,8,power_law_1.2,0.05448319911956787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,4,balanced,0.035786665976047516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,4,balanced,0.07115200161933899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,4,balanced,0.03620799879233042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,8,power_law_1.2,0.32804479598999026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,8,power_law_1.2,0.057555198669433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,4,balanced,0.03619733452796936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,4,balanced,0.06651733318964641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,8,power_law_1.2,0.5014336109161377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,8,power_law_1.2,0.07004799842834472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,4,balanced,0.03698666642109553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,8,power_law_1.2,0.661836814880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,4,balanced,0.03754133234421412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,4,balanced,0.08948799967765808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,4,balanced,0.038922667503356934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,8,power_law_1.2,0.8263936042785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,4,balanced,0.04258666435877482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,4,balanced,0.09118933478991191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,8,power_law_1.2,0.07222399711608887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,4,balanced,0.04223466912905375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,8,power_law_1.2,1.3188544273376466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,4,balanced,0.1343839963277181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,4,balanced,0.04498666524887085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,8,power_law_1.2,0.09085440039634704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,8,power_law_1.2,2.4040895462036134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,4,balanced,0.049653331438700356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,4,balanced,0.0537013312180837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,4,balanced,0.15558933218320212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,4,balanced,0.07083733379840851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,4,balanced,0.024959998826185863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,8,power_law_1.2,0.11682560443878173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,4,balanced,0.07780799766381581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,4,balanced,0.025029333929220837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,4,balanced,0.23934932549794516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,4,balanced,0.10496532917022705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,4,balanced,0.02518400053183238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,4,balanced,0.11772267023722331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,8,power_law_1.2,0.135808002948761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,4,balanced,0.02701333413521449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,4,balanced,0.2810239990552266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,4,balanced,0.1674720048904419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,4,balanced,0.027877333263556164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,8,power_law_1.2,0.21220479011535645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,4,balanced,0.2015413244565328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,4,balanced,0.02829333394765854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,4,balanced,0.35939733187357586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,4,balanced,0.028362666567166645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,8,power_law_1.2,0.26654720306396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,4,balanced,0.2974666754404704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,8,power_law_1.2,0.41452798843383787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,4,balanced,0.028117333849271137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,8,power_law_1.2,0.5056704044342041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,4,balanced,0.02903466671705246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,4,balanced,0.36956799030303955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,8,power_law_1.2,0.796940803527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,4,balanced,0.029701332251230877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,4,balanced,0.5196106831232706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,8,power_law_1.2,0.9720576286315918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,8,power_law_1.2,1.2908479690551757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,4,balanced,0.46246933937072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,8,power_law_1.2,1.9780672073364258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,4,balanced,0.029669334491093952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,8,power_law_1.2,4.0105022430419925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,4,balanced,0.030266667405764263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,4,balanced,0.03128000100453695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,4,balanced,0.6998666922251383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,4,balanced,0.030602666238943737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,4,balanced,0.9453813234965006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,4,balanced,0.03788266579310099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,4,balanced,0.03827200084924698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,4,power_law_1.01,0.032793599367141726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,4,balanced,1.4287573496500652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,4,balanced,0.03896533449490865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,4,power_law_1.01,0.029209598898887634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,4,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,4,power_law_1.01,0.03022719919681549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,4,balanced,0.04663466910521189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,4,power_law_1.01,0.030559998750686646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,4,balanced,0.05005866785844167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,4,power_law_1.01,0.03816959857940674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,4,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,4,power_law_1.01,0.043110400438308716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,4,power_law_1.01,0.033030399680137636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,4,power_law_1.01,0.038201600313186646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,4,power_law_1.01,0.03521279990673065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,4,power_law_1.01,0.03776639997959137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,4,power_law_1.01,0.03375999927520752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,4,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,4,balanced,0.06277866661548615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,4,power_law_1.01,0.03496319949626923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,4,power_law_1.01,0.03938559889793396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,4,power_law_1.01,0.034585601091384886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,4,power_law_1.01,0.04120959937572479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,4,power_law_1.01,0.034892800450325015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,4,power_law_1.01,0.0406464010477066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,4,power_law_1.01,0.03606399893760681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,4,balanced,0.07685333490371704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,4,power_law_1.01,0.03782399892807007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,4,power_law_1.01,0.048844799399375916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,4,power_law_1.01,0.03861120045185089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,4,power_law_1.01,0.0383679986000061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,4,power_law_1.01,0.05834239721298218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,4,power_law_1.01,0.038975998759269714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,4,power_law_1.01,0.05984640121459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,4,power_law_1.01,0.04121600091457367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,4,power_law_1.01,0.042854401469230655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,4,balanced,0.10241066416104634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,4,power_law_1.01,0.07311999797821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,4,power_law_1.01,0.04782719910144806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,4,power_law_1.01,0.050329601764678954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,4,power_law_1.01,0.09159039855003356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,4,power_law_1.01,0.05320320129394531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,4,power_law_1.01,0.09192960262298584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,4,power_law_1.01,0.06762880086898804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,4,power_law_1.01,0.10699520111083985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,4,power_law_1.01,0.08122239708900451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,4,balanced,0.1230560044447581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,4,power_law_1.01,0.10318080186843873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,4,power_law_1.01,0.11361919641494751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,4,power_law_1.01,0.11029119491577148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,4,balanced,0.18720000982284546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,4,power_law_1.01,0.16669440269470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,4,power_law_1.01,0.15790079832077025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,4,power_law_1.01,0.19133440256118775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,4,power_law_1.01,0.14991999864578248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,4,power_law_1.01,0.24036478996276855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,4,power_law_1.01,0.025593599677085875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,4,balanced,0.2461386720339457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,4,power_law_1.01,0.32169599533081056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,4,power_law_1.01,0.2267712116241455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,4,power_law_1.01,0.4471615791320801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,4,power_law_1.01,0.024928000569343568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,4,power_law_1.01,0.3638783931732178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,4,power_law_1.01,0.5630911827087403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,4,balanced,0.3575466473897298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,4,power_law_1.01,0.024966399371623992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,4,power_law_1.01,0.3642240047454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,4,power_law_1.01,0.8921792030334472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,4,power_law_1.01,1.317024040222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,4,power_law_1.01,0.027161601185798644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,4,power_law_1.01,0.5059775829315185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,4,power_law_1.01,3.131167984008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,4,power_law_1.01,0.027577599883079527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,4,power_law_1.01,0.7045504093170166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,4,balanced,0.4675840139389038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,4,power_law_1.01,0.02824319899082184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,4,power_law_1.01,1.2507200241088867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,4,power_law_1.01,0.028832000494003297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,4,power_law_1.01,2.537727928161621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,4,power_law_1.01,0.029919999837875366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,4,balanced,0.577450672785441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,4,power_law_1.01,0.03121280074119568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,4,power_law_1.01,0.03276160061359405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,4,power_law_1.2,0.03289600014686585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,4,balanced,0.9020480314890543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,4,power_law_1.01,0.03792639970779419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,4,power_law_1.2,0.028972798585891725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,4,power_law_1.01,0.03701759874820709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,4,power_law_1.2,0.028697600960731505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,4,power_law_1.2,0.030483201146125793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,4,power_law_1.01,0.043647998571395875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,4,power_law_1.01,0.04459519982337952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,4,power_law_1.2,0.03047040104866028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,4,power_law_1.2,0.037011200189590455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,4,power_law_1.2,0.04145280122756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,4,power_law_1.01,0.04849919974803925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,4,power_law_1.2,0.03824639916419983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,4,balanced,1.7872053782145183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,4,power_law_1.01,0.05484799742698669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,4,power_law_1.2,0.03820799887180328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,4,power_law_1.01,0.0636031985282898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,4,power_law_1.2,0.03777920007705689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,4,power_law_1.2,0.04097920060157776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,4,power_law_1.01,0.0732800006866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,4,power_law_1.2,0.04181120097637177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,4,power_law_1.01,0.09603840112686157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,4,power_law_1.2,0.04336000084877014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,4,power_law_1.2,0.054099202156066895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,4,power_law_1.2,0.03383679986000061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,4,power_law_1.01,0.11114879846572875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,4,power_law_1.2,0.061926400661468504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,4,power_law_1.2,0.034067198634147644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,4,power_law_1.2,0.06850559711456299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,4,power_law_1.01,0.1624127984046936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,4,power_law_1.2,0.03617919981479645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,4,power_law_1.2,0.0658623993396759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,4,power_law_1.2,0.025536000728607178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,4,power_law_1.2,0.03394559919834137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,4,power_law_1.2,0.08520960211753845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,4,power_law_1.01,0.23594241142272948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,4,power_law_1.2,0.024915200471878052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,8,balanced,0.050581331054369606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,4,power_law_1.2,0.034841600060462954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,4,power_law_1.2,0.09475839734077454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,4,power_law_1.2,0.025017601251602174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,4,power_law_1.2,0.03461759984493255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,8,balanced,0.04528533418973287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,4,power_law_1.01,0.24097919464111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,4,power_law_1.2,0.11275520324707031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,4,power_law_1.2,0.02723200023174286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,4,power_law_1.2,0.03527680039405823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,8,balanced,0.045007998744646706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,4,power_law_1.01,0.4720320224761963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,4,power_law_1.2,0.1110975980758667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,4,power_law_1.2,0.027244800329208375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,4,power_law_1.2,0.036025598645210266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,8,balanced,0.046613335609436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,4,power_law_1.01,0.5988671779632568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,4,power_law_1.2,0.1713152050971985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,4,power_law_1.2,0.02808319926261902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,8,balanced,0.047040000557899475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,4,power_law_1.2,0.03760640025138855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,4,power_law_1.01,0.7970816135406494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,4,power_law_1.2,0.029497599601745604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,4,power_law_1.2,0.15163520574569703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,8,balanced,0.04776533444722494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,4,power_law_1.2,0.038873600959777835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,4,power_law_1.2,0.029791998863220214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,4,power_law_1.01,1.0310336112976075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,4,power_law_1.2,0.2784320116043091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,8,balanced,0.04784533381462097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,4,power_law_1.2,0.039103999733924866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,4,power_law_1.2,0.03028480112552643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,4,power_law_1.01,1.174995231628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,4,power_law_1.2,0.2832319974899292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,8,balanced,0.04433600107828776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,4,power_law_1.2,0.03984639942646027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,4,power_law_1.2,0.03230080008506775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,4,power_law_1.2,0.5524735927581788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,4,power_law_1.01,2.1540416717529296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,8,balanced,0.04343999922275543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,4,power_law_1.2,0.0417279988527298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,4,power_law_1.2,0.629798412322998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,8,balanced,0.04481600224971771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,4,power_law_1.01,4.706566238403321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,4,power_law_1.2,0.042719998955726625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,4,power_law_1.2,0.037868800759315493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,4,power_law_1.2,1.0016575813293458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,4,power_law_1.2,0.052153599262237546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,8,balanced,0.044437333941459656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,4,power_law_1.2,0.041606399416923526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,4,power_law_1.2,1.4489215850830077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,4,power_law_1.2,0.05056639909744263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,8,balanced,0.047653332352638245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,4,power_law_1.2,0.03857919871807099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,4,power_law_1.2,2.3790399551391603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,4,power_law_1.2,0.05041279792785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,8,balanced,0.04828266799449921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,4,power_law_1.2,0.04599680006504059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,4,power_law_1.2,0.06408320069313049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,8,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,4,power_law_1.2,0.0760320007801056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,8,balanced,0.05319466690222422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,4,power_law_1.2,0.05028480291366577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,4,power_law_1.2,0.10818560123443603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,8,balanced,0.05493866900602976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,4,power_law_1.2,0.05735679864883423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,4,power_law_1.2,0.11920000314712524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,4,power_law_1.2,0.06629760265350342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,8,balanced,0.05579199890295664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,4,power_law_1.2,0.16594560146331788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,8,balanced,0.06149866680304209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,4,power_law_1.2,0.2039423942565918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,4,power_law_1.2,0.07152000069618225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,8,balanced,0.06333866715431213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,4,power_law_1.2,0.25868799686431887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,4,power_law_1.2,0.091430401802063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,8,balanced,0.07321600119272868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,4,power_law_1.2,0.3666111946105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,8,balanced,0.07502399881680806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,4,power_law_1.2,0.5015999794006347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,4,power_law_1.2,0.10877439975738526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,8,balanced,0.1090613305568695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,4,power_law_1.2,0.6848063945770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,8,balanced,0.10693333546320598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,4,power_law_1.2,0.8233856201171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,4,power_law_1.2,0.16159360408782958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,4,power_law_1.2,1.3057600021362306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,8,balanced,0.0397173340121905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,8,balanced,0.16381333271662393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,4,power_law_1.2,2.973868751525879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,4,power_law_1.2,0.22945280075073243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,8,balanced,0.039647998909155525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,8,balanced,0.17974400520324707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,8,balanced,0.039701332648595176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,4,power_law_1.2,0.28679680824279785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,8,balanced,0.04012266546487808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,4,power_law_1.2,0.5156608104705811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,8,balanced,0.2588533361752828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,8,balanced,0.04161066561937332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,4,power_law_1.2,0.6755904197692871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,8,balanced,0.04271466533342997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,4,power_law_1.2,0.8419391632080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,8,balanced,0.32099199295043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,8,balanced,0.04316799839337667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,4,power_law_1.2,1.1628543853759765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,8,balanced,0.042303999265034996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,4,power_law_1.2,1.3808128356933593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,8,balanced,0.04271999994913737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,8,balanced,0.42846934000651044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,4,power_law_1.2,2.2773887634277346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,8,balanced,0.042912001411120095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,8,balanced,0.03939733405907949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,4,power_law_1.2,5.146470260620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,8,balanced,0.040522667268911995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,8,balanced,0.0418453315893809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,8,balanced,0.6186186472574869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,8,balanced,0.04182399809360504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,8,balanced,0.04776533444722494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,8,balanced,0.02888533224662145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,8,balanced,0.05050666630268097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,8,balanced,0.028688001135985058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,8,balanced,0.049695998430252075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,8,balanced,0.028757333755493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,8,balanced,0.06107733150323232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,8,balanced,0.030239999294281006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,8,balanced,0.06592533489068349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,8,balanced,0.031162666777769726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,8,balanced,0.08042666812737782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,8,balanced,0.03130666663249334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,8,power_law_1.01,0.038464000821113585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,8,balanced,1.1789440313975017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,8,balanced,0.031632001201311745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,8,power_law_1.01,0.04377599954605103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,8,balanced,0.09015466769536336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,8,power_law_1.01,0.04410879909992218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,8,balanced,0.03137599925200144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,8,power_law_1.01,0.04567680060863495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,8,balanced,0.12619733810424805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,8,power_law_1.01,0.045926401019096376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,8,balanced,0.03164266546567281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,8,power_law_1.01,0.053504002094268796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,8,balanced,0.14246400197347006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,8,balanced,0.03278400003910065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,8,power_law_1.01,0.05861759781837463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,8,power_law_1.01,0.047628799080848695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,8,balanced,0.20269866784413657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,8,power_law_1.01,0.04757120013237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,8,power_law_1.01,0.05055360198020935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,8,power_law_1.01,0.050944000482559204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,8,balanced,0.24131200710932413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,8,power_law_1.01,0.06501759886741638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,8,balanced,0.0321066677570343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,8,power_law_1.01,0.0673088014125824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,8,power_law_1.01,0.06911360025405884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,8,balanced,0.03271466741959254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,8,power_law_1.01,0.0889792025089264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,8,balanced,0.3494986693064372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,8,power_law_1.01,0.09175040125846863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,8,balanced,0.03399466723203659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,8,power_law_1.01,0.0864960014820099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,8,balanced,0.032501332461833954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,8,power_law_1.01,0.1054527997970581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,8,power_law_1.01,0.11277439594268798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,8,balanced,0.44040000438690186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,8,power_law_1.01,0.1415295958518982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,8,power_law_1.01,0.1739776015281677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,8,power_law_1.01,0.2605056047439575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,8,power_law_1.01,0.27937281131744385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,8,balanced,0.041050667564074196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,8,balanced,0.5599733193715414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,8,power_law_1.01,0.4306943893432617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,8,power_law_1.01,0.5292543888092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,8,balanced,0.04065600037574768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,8,power_law_1.01,0.7901887893676758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,8,balanced,0.04126933217048645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,8,power_law_1.01,1.0683839797973633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,8,power_law_1.01,1.2131967544555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,8,balanced,0.8522186279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,8,power_law_1.01,2.0733951568603515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,8,power_law_1.01,3.943257522583008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,8,power_law_1.01,0.03863680064678192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,8,balanced,0.04960533479849497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,8,power_law_1.01,0.039110401272773744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,8,balanced,0.053455998500188194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,8,power_law_1.01,0.0392767995595932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,8,power_law_1.01,0.04023039937019348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,8,power_law_1.01,0.02837119996547699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,8,power_law_1.01,0.04023680090904236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,8,balanced,1.6482666333516438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,8,power_law_1.01,0.04154880046844482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,8,power_law_1.01,0.028198400139808656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,8,power_law_1.01,0.028537601232528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,8,power_law_1.01,0.04129279851913452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,8,balanced,0.0682666649421056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,8,power_law_1.01,0.030444800853729248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,8,power_law_1.01,0.0412992000579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,8,power_law_1.01,0.030611199140548707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,8,power_law_1.01,0.041503998637199405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,8,power_law_1.01,0.03084160089492798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,8,power_law_1.01,0.042752000689506534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,8,balanced,0.07769600053628285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,8,power_law_1.01,0.03402239978313446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,8,power_law_1.01,0.04302079975605011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,8,power_law_1.01,0.03495680093765259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,8,power_law_1.01,0.044710400700569156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,8,power_law_1.01,0.03504000008106232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,8,power_law_1.01,0.046988800168037415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,8,balanced,0.10076266527175903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,8,power_law_1.01,0.03684479892253876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,8,power_law_1.2,0.0384768009185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,8,power_law_1.01,0.057734400033950806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,8,balanced,0.12169599533081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,8,power_law_1.01,0.06744319796562195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,8,power_law_1.2,0.03852800130844116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,8,power_law_1.01,0.07445120215415954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,8,power_law_1.2,0.03842560052871704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,8,power_law_1.01,0.04310399889945984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,8,power_law_1.01,0.06857600212097167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,8,power_law_1.2,0.03935360014438629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,8,power_law_1.01,0.04789760112762451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,8,power_law_1.01,0.09080320000648498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,8,power_law_1.2,0.04015359878540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,8,power_law_1.01,0.05189759731292724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,8,balanced,0.17706666390101114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,8,power_law_1.01,0.09720320105552674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,8,power_law_1.2,0.05729920268058777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,8,power_law_1.01,0.06691200137138367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,8,power_law_1.01,0.12836480140686035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,8,power_law_1.2,0.06046720147132874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,8,balanced,0.22537599007288614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,8,power_law_1.01,0.1506880044937134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,8,power_law_1.2,0.04728319942951202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,8,power_law_1.01,0.06438400149345398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,8,power_law_1.2,0.04885759949684143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,8,balanced,0.34136001269022626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,8,power_law_1.01,0.2050879955291748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,8,power_law_1.01,0.06937599778175355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,8,power_law_1.2,0.049772799015045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,8,power_law_1.01,0.2481152057647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,8,power_law_1.01,0.09360640048980713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,8,power_law_1.2,0.051583999395370485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,8,power_law_1.01,0.35498239994049074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,8,balanced,0.44485334555308026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,8,power_law_1.2,0.06222720146179199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,8,power_law_1.01,0.47994241714477537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,8,power_law_1.2,0.06435199975967407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,8,power_law_1.01,0.09991040229797363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,8,power_law_1.2,0.06940159797668458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,8,power_law_1.2,0.038841599225997926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,8,power_law_1.01,0.6959936141967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,8,power_law_1.01,0.12524800300598143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,8,balanced,0.5473066568374634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,8,power_law_1.2,0.09317119717597962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,8,power_law_1.01,0.9188672065734863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,8,power_law_1.2,0.038764798641204835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,8,power_law_1.2,0.08644480109214783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,8,power_law_1.2,0.039340800046920775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,8,power_law_1.01,1.158835220336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,8,power_law_1.01,0.1534719944000244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,8,power_law_1.2,0.08673920035362244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,8,power_law_1.2,0.04013440012931824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,8,power_law_1.2,0.11368319988250733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,8,power_law_1.01,1.860371208190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,8,power_law_1.2,0.04066559970378876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,8,balanced,0.8601493040720621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,8,power_law_1.01,0.19841279983520507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,8,power_law_1.2,0.10638079643249512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,8,power_law_1.2,0.041484799981117246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,8,power_law_1.01,3.3057151794433595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,8,power_law_1.2,0.14927999973297118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,8,power_law_1.2,0.04108799993991852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,8,power_law_1.01,0.29322240352630613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,8,power_law_1.2,0.18344320058822633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,8,power_law_1.2,0.04172160029411316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,8,power_law_1.01,0.3273344039916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,8,power_law_1.2,0.26686079502105714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,8,power_law_1.2,0.042208001017570496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,8,power_law_1.2,0.29161601066589354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,8,power_law_1.2,0.04354560077190399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,8,power_law_1.01,0.5775680065155029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,8,power_law_1.2,0.3863552093505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,8,power_law_1.2,0.0438975989818573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,8,power_law_1.2,0.028377598524093627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,8,power_law_1.01,0.6877439975738525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,8,balanced,1.6998880704243977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,8,power_law_1.2,0.5260608196258545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,8,power_law_1.2,0.044838398694992065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,8,power_law_1.2,0.028300800919532777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,8,power_law_1.01,1.087168025970459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,8,power_law_1.2,0.048102399706840514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,8,power_law_1.2,0.7926911830902099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,8,power_law_1.2,0.028601598739624024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,8,power_law_1.01,1.4325504302978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,8,power_law_1.2,0.05869439840316772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,8,power_law_1.2,1.006822395324707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,8,power_law_1.2,0.030188798904418945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,8,power_law_1.01,1.655731201171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,8,power_law_1.2,0.07011200189590454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,8,power_law_1.2,1.2734911918640137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,8,power_law_1.2,0.03059839904308319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,8,power_law_1.2,0.07210879921913146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,8,power_law_1.01,2.935296058654785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,8,power_law_1.2,2.1928192138671876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,8,power_law_1.2,0.03110400140285492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,8,power_law_1.2,0.06903039813041686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,8,power_law_1.2,0.033881598711013795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,8,power_law_1.01,5.620851135253906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,8,power_law_1.2,3.9851070404052735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,8,power_law_1.2,0.08728960156440735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,8,power_law_1.2,0.03495039939880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,8,power_law_1.2,0.09827839732170104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,8,power_law_1.2,0.035308799147605895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,8,power_law_1.2,0.13063039779663085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,8,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,8,power_law_1.2,0.15443840026855468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,8,power_law_1.2,0.21396479606628419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,8,power_law_1.2,0.04038400053977966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,8,power_law_1.2,0.2551487922668457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,8,power_law_1.2,0.051571202278137204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,8,power_law_1.2,0.35189759731292725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,8,power_law_1.2,0.0535103976726532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,8,power_law_1.2,0.46910080909729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,4,balanced,0.039077334105968475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,8,power_law_1.2,0.06675840020179749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,8,power_law_1.2,0.7213888168334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,4,balanced,0.03925866633653641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,4,balanced,0.04418133199214935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,8,power_law_1.2,0.9333056449890137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,4,balanced,0.04580800235271454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,4,balanced,0.046538665890693665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,8,power_law_1.2,0.06687359809875489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,4,balanced,0.04683733483155569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,8,power_law_1.2,1.198796844482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,8,power_law_1.2,0.06989439725875854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,4,balanced,0.047242666284243263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,8,power_law_1.2,0.09234560132026673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,8,power_law_1.2,1.8864191055297852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,4,balanced,0.048512001832326256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,4,balanced,0.046853333711624146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,4,balanced,0.04786133269468943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,8,power_law_1.2,3.398764801025391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,4,balanced,0.04530133306980133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,8,power_law_1.2,0.09823359847068787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,4,balanced,0.03519999980926514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,4,balanced,0.046906664967536926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,8,power_law_1.2,0.12868479490280152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,4,balanced,0.04717333118120829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,4,balanced,0.03540800015131632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,4,balanced,0.04970133304595947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,4,balanced,0.05830933153629303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,4,balanced,0.041589332123597465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,4,balanced,0.04197866717974345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,4,balanced,0.05923733115196228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,8,power_law_1.2,0.1708351969718933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,4,balanced,0.05866666634877523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,4,balanced,0.04276266694068909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,4,balanced,0.06548800071080525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,4,balanced,0.03808533400297165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,8,power_law_1.2,0.2161407947540283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,4,balanced,0.06772799789905548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,4,balanced,0.03817066550254822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,8,power_law_1.2,0.3130687952041626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,4,balanced,0.08483200271924336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,4,balanced,0.03834133346875509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,8,power_law_1.2,0.34967041015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,4,balanced,0.03876800090074539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,4,balanced,0.0940106709798177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,4,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,4,balanced,0.11220266421635945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,8,power_law_1.2,0.5155136108398437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,4,balanced,0.04635733366012573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,4,balanced,0.13617066542307535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,8,power_law_1.2,0.6234879970550538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,4,balanced,0.045941332976023354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,4,balanced,0.19962666432062784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,8,power_law_1.2,1.080179214477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,4,balanced,0.04637333254019419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,4,balanced,0.04287999868392944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,4,balanced,0.214410662651062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,8,power_law_1.2,1.463411235809326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,4,balanced,0.04862933357556661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,8,power_law_1.2,1.6121152877807616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,4,balanced,0.04938133557637533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,4,balanced,0.33242134253184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,8,power_law_1.2,2.782035255432129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,4,balanced,0.05296533306439718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,8,power_law_1.2,5.794591903686523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,4,balanced,0.3933279911677043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,4,balanced,0.06235733131567637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,4,balanced,0.07069866855939229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,4,balanced,0.08769599596659343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,4,balanced,0.5119466781616211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,4,balanced,0.10419199864069621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,4,balanced,0.13300800323486328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,4,balanced,0.1604213317235311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,4,balanced,0.7563146750132242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,4,balanced,0.22901866833368936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,4,balanced,0.276256004969279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,4,balanced,0.3944053252538045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,4,balanced,1.441381295522054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,4,balanced,0.5085066556930542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,4,balanced,0.028570666909217834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,4,balanced,0.6403306722640991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,4,balanced,0.028368001182874043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,4,balanced,0.029077333708604176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,4,power_law_1.01,0.04483200013637543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,4,balanced,0.030453334252039593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,4,balanced,0.03143466760714849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,4,power_law_1.01,0.04322560131549835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,4,balanced,0.9838133653004965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,4,balanced,0.031717332700888314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,4,power_law_1.01,0.043084800243377686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,4,balanced,0.03236266722281774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,4,power_law_1.01,0.045561599731445315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,4,power_law_1.01,0.0458624005317688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,4,balanced,0.03219733387231827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,4,power_law_1.01,0.05505920052528381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,4,power_law_1.01,0.035366401076316833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,4,power_law_1.01,0.06165760159492493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,4,balanced,0.03254933406909307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,4,power_law_1.01,0.03603839874267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,4,power_law_1.01,0.05059199929237366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,4,balanced,0.0335413341720899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,4,power_law_1.01,0.0379967987537384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,4,power_law_1.01,0.051148802042007446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,4,power_law_1.01,0.04196479916572571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,4,power_law_1.01,0.028908801078796387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,4,balanced,2.0175093015034995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,4,power_law_1.01,0.052179199457168576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,4,power_law_1.01,0.04232960045337677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,4,power_law_1.01,0.02847360074520111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,4,power_law_1.01,0.05002880096435547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,4,power_law_1.01,0.038790398836135866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,4,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,4,power_law_1.01,0.05454720258712768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,4,balanced,0.033402666449546814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,4,power_law_1.01,0.03934719860553741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,4,power_law_1.01,0.03059200048446655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,4,power_law_1.01,0.051820802688598636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,4,balanced,0.03427733232577642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,4,power_law_1.01,0.040403199195861814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,4,power_law_1.01,0.0310591995716095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,4,power_law_1.01,0.06502400040626526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,4,power_law_1.01,0.04105600118637085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,4,balanced,0.03598399957021078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,4,power_law_1.01,0.03329919874668121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,4,power_law_1.01,0.07886080145835876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,4,power_law_1.01,0.040863999724388124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,4,balanced,0.03565333286921183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,4,power_law_1.01,0.03441280126571655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,4,power_law_1.01,0.08552320003509521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,4,power_law_1.01,0.04635519981384277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,4,power_law_1.01,0.03521920144557953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,4,power_law_1.01,0.04664320051670075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,4,power_law_1.01,0.07751039862632751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,4,power_law_1.2,0.04460160136222839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,4,power_law_1.01,0.10167039632797241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,4,power_law_1.01,0.04865280091762543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,4,power_law_1.01,0.03553920090198517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,4,balanced,0.04355733096599579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,4,power_law_1.01,0.11388159990310669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,4,power_law_1.2,0.042694398760795595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,4,power_law_1.01,0.055961602926254274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,4,power_law_1.01,0.03771519958972931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,4,power_law_1.01,0.12739839553833007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,4,balanced,0.043866669138272606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,4,power_law_1.2,0.04222719967365265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,4,power_law_1.01,0.061913597583770755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,4,balanced,0.04868799944718679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,4,power_law_1.01,0.15395840406417846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,4,power_law_1.01,0.06647040247917176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,4,power_law_1.2,0.04596480131149292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,4,power_law_1.01,0.04259200096130371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,4,power_law_1.01,0.07180799841880799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,4,power_law_1.2,0.04573439955711365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,4,power_law_1.01,0.2180351972579956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,4,power_law_1.01,0.04602240025997162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,4,power_law_1.01,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,4,power_law_1.01,0.32731521129608154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,4,power_law_1.2,0.060601598024368285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,4,balanced,0.05919999877611796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,4,power_law_1.01,0.0468095988035202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,4,power_law_1.01,0.09144960045814514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,4,power_law_1.2,0.06195840239524841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,4,power_law_1.01,0.4794367790222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,4,balanced,0.06706133484840393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,4,power_law_1.01,0.11785600185394288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,4,power_law_1.01,0.06330239772796631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,4,power_law_1.2,0.051283198595047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,4,power_law_1.01,0.5202432155609131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,4,power_law_1.01,0.142086398601532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,4,power_law_1.2,0.051072001457214355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,4,power_law_1.01,0.7260287761688232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,4,power_law_1.01,0.20344319343566894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,4,power_law_1.2,0.05178239941596985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,4,power_law_1.01,0.951296043395996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,4,balanced,0.08451732993125916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,4,power_law_1.01,0.05935360193252563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,4,power_law_1.01,0.27552640438079834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,4,power_law_1.2,0.05003520250320435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,4,power_law_1.01,1.4251839637756347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,4,power_law_1.01,0.06947839856147767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,4,power_law_1.01,0.4244224071502686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,4,power_law_1.2,0.05178239941596985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,4,power_law_1.01,0.08497920036315917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,4,power_law_1.01,1.7673791885375976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,4,power_law_1.01,0.46628479957580565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,4,power_law_1.2,0.05790079832077026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,4,balanced,0.09983999530474345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,4,power_law_1.01,0.681766414642334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,4,power_law_1.01,3.8072830200195313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,4,power_law_1.2,0.07240319848060608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,4,power_law_1.01,0.09747200012207032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,4,power_law_1.01,0.86746244430542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,4,power_law_1.2,0.07895039916038513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,4,power_law_1.01,0.11335680484771729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,4,power_law_1.01,1.1656000137329101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,4,power_law_1.2,0.08639360070228577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,4,power_law_1.01,1.8256832122802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,4,power_law_1.01,0.15927679538726808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,4,power_law_1.2,0.08456959724426269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,4,balanced,0.13563199838002524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,4,power_law_1.01,4.0578369140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,4,power_law_1.2,0.10883200168609619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,4,power_law_1.01,0.22711679935455323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,4,balanced,0.17653866608937582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,4,power_law_1.2,0.10696959495544434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,4,balanced,0.27056533098220825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,4,power_law_1.2,0.14714239835739135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,4,power_law_1.2,0.03640959858894348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,4,power_law_1.01,0.3191744089126587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,4,power_law_1.2,0.14596480131149292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,4,balanced,0.3471946716308594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,4,power_law_1.2,0.036262398958206175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,4,power_law_1.01,0.43144960403442384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,4,power_law_1.2,0.2346112012863159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,4,power_law_1.2,0.03992320001125336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,4,power_law_1.01,0.771014404296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,4,power_law_1.2,0.3099776029586792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,4,balanced,0.5052533149719238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,4,power_law_1.2,0.042828801274299624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,4,power_law_1.01,0.7417280197143554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,4,power_law_1.2,0.3999552011489868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,4,power_law_1.2,0.04211199879646301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,4,power_law_1.2,0.43614721298217773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,4,power_law_1.01,1.4690303802490234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,4,balanced,0.6639626820882162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,4,power_law_1.01,1.425881576538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,4,power_law_1.2,0.038431999087333676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,4,power_law_1.2,0.6220160007476807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,4,power_law_1.01,2.0640895843505858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,4,power_law_1.2,0.039628800749778745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,4,power_law_1.2,0.9003840446472168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,4,balanced,0.8243199984232584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,4,power_law_1.2,0.028812798857688903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,4,power_law_1.2,0.04044800102710724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,4,power_law_1.2,1.3309696197509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,4,power_law_1.01,3.569209671020508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,4,power_law_1.2,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,4,power_law_1.2,0.02855679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,4,power_law_1.2,2.09736328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,4,power_law_1.01,5.487347030639649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,4,power_law_1.2,0.041631999611854556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,4,power_law_1.2,0.0286080002784729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,4,power_law_1.2,3.9973377227783202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,4,power_law_1.2,0.030393600463867188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,4,power_law_1.2,0.04542079865932465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,4,balanced,1.3002933661142986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,4,power_law_1.2,0.03033599853515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,4,power_law_1.2,0.04636160135269165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,4,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,4,power_law_1.2,0.04784640073776245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,4,power_law_1.2,0.033817601203918454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,4,power_law_1.2,0.052211201190948485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,4,power_law_1.2,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,4,power_law_1.2,0.06284800171852112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,4,power_law_1.2,0.06672000288963317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,4,power_law_1.2,0.03751679956912994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,4,power_law_1.2,0.06682239770889283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,4,power_law_1.2,0.0378495991230011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,4,power_law_1.2,0.08399360179901123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,4,balanced,2.5869599978129068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,4,power_law_1.2,0.09432960152626038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,4,power_law_1.2,0.129203200340271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,4,power_law_1.2,0.04302720129489899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,4,power_law_1.2,0.16136319637298585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,4,power_law_1.2,0.04936319887638092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,4,power_law_1.2,0.1878335952758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,4,power_law_1.2,0.04993920028209686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,4,power_law_1.2,0.29047040939331054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,4,power_law_1.2,0.06427519917488098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,4,power_law_1.2,0.4304448127746582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,4,power_law_1.2,0.5458240032196044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,4,power_law_1.2,0.07108479738235474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,4,power_law_1.2,0.6995200157165528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,4,power_law_1.2,0.07040640115737914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,4,power_law_1.2,0.9654399871826171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,4,power_law_1.2,0.08360959887504578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,4,power_law_1.2,1.351200008392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,4,power_law_1.2,0.10390399694442749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,4,power_law_1.2,1.8717952728271485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,4,power_law_1.2,0.1332479953765869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,4,power_law_1.2,3.9225406646728516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,4,power_law_1.2,0.1729024052619934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,4,power_law_1.2,0.2413952112197876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,4,power_law_1.2,0.3530303955078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,4,power_law_1.2,0.4791679859161377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,4,power_law_1.2,0.7470016002655029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,4,power_law_1.2,0.893228816986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,128,balanced,0.1879840095837911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,4,power_law_1.2,1.2179903984069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,128,balanced,0.1851093371709188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,128,balanced,0.186298668384552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,4,power_law_1.2,1.8887104034423827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,128,balanced,0.1898826758066813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,4,power_law_1.2,2.199967956542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,128,balanced,0.19484267632166544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,128,balanced,0.3511893351872762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,4,power_law_1.2,3.0930559158325197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,128,balanced,0.3626720110575358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,128,balanced,0.35930665334065753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,4,power_law_1.2,7.9102531433105465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,128,balanced,0.34229334195454914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,128,balanced,0.34585599104563397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,128,balanced,0.35806934038798016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,128,balanced,0.3482293287913005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,128,balanced,0.3460853497187297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,128,balanced,0.35440532366434735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,128,balanced,0.37693333625793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,128,balanced,0.37293867270151776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,128,balanced,0.32791467507680255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,128,balanced,0.34489067395528156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,128,balanced,0.33828266461690265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,128,balanced,0.33739201227823895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,128,balanced,0.32893866300582886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,128,balanced,0.11731200416882832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,128,balanced,0.29436800877253216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,128,balanced,0.116565336783727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,128,balanced,0.11690133810043335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,128,balanced,0.1216266651948293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,128,balanced,0.11567999919255574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,128,balanced,0.24772799015045166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,128,balanced,0.20665599902470908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,128,balanced,0.20002132654190063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,128,balanced,0.20110932985941568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,128,balanced,0.21741867065429688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,128,balanced,0.5428373416264852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,128,balanced,0.2055573264757792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,128,balanced,0.21053866545359293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,128,balanced,0.21955732504526773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,128,balanced,0.2146079937616984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,128,balanced,0.19917333126068115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,128,balanced,0.44226133823394775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,128,balanced,0.048351998130480446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,128,balanced,0.20972800254821777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,128,balanced,0.04854399959246317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,128,balanced,0.21396267414093018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,128,balanced,0.04887466629346212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,128,balanced,0.05308799942334493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,128,balanced,0.21519466241200766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,128,balanced,0.052202666799227394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,128,balanced,0.22344533602396646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,128,balanced,0.06454400221506755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,128,balanced,0.06592533489068349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,128,balanced,0.21452265977859497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,128,balanced,0.06675200164318085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,128,balanced,0.6385546525319418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,128,balanced,0.06669866542021434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,128,balanced,0.2355253299077352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,128,balanced,0.067071999112765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,128,balanced,0.06840000053246816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,128,balanced,0.24093866348266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,128,balanced,0.06869866450627644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,128,balanced,0.0699839989344279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,128,balanced,0.07069333394368489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,128,balanced,0.25334932406743366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,128,power_law_1.01,0.2096127986907959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,128,balanced,0.0759093314409256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,128,power_law_1.01,0.33678719997406004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,128,balanced,0.07675733168919881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,128,power_law_1.01,0.19761919975280762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,128,balanced,0.07969066500663757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,128,balanced,0.2566666603088379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,128,balanced,0.8291520277659098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,128,power_law_1.01,0.17694079875946045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,128,power_law_1.01,0.3452735900878906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,128,power_law_1.01,0.17271679639816284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,128,power_law_1.01,0.3042815923690796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,128,power_law_1.01,0.20748798847198485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,128,balanced,0.08928533395131429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,128,power_law_1.01,0.36357119083404543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,128,power_law_1.01,0.2093951940536499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,128,balanced,0.4526933431625366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,128,power_law_1.01,0.36392960548400877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,128,power_law_1.01,0.20753920078277588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,128,power_law_1.01,0.05942400097846985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,128,power_law_1.01,0.3537919998168945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,128,power_law_1.01,0.20416638851165772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,128,power_law_1.01,0.35567359924316405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,128,power_law_1.01,0.05813760161399841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,128,power_law_1.01,0.20625920295715333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,128,power_law_1.01,0.05484799742698669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,128,power_law_1.01,0.35306239128112793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,128,balanced,0.4545919895172119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,128,power_law_1.01,0.20088319778442382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,128,balanced,0.094842662413915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,128,power_law_1.01,0.06154879927635193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,128,balanced,1.0198079744974773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,128,power_law_1.01,0.3481343984603882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,128,power_law_1.01,0.19973119497299194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,128,power_law_1.01,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,128,power_law_1.01,0.19630719423294068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,128,balanced,0.10972799857457478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,128,power_law_1.01,0.3439487934112549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,128,power_law_1.01,0.06449919939041138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,128,power_law_1.01,0.19667199850082398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,128,power_law_1.01,0.33923840522766113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,128,balanced,0.12083199620246887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,128,power_law_1.01,0.19371520280838012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,128,power_law_1.01,0.06531199812889099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,128,power_law_1.01,0.33593599796295165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,128,power_law_1.01,0.19342080354690552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,128,power_law_1.01,0.06639360189437866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,128,balanced,0.654858668645223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,128,power_law_1.01,0.33127679824829104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,128,power_law_1.01,0.18754559755325317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,128,power_law_1.01,0.0664192020893097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,128,power_law_1.01,0.32108159065246583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,128,power_law_1.01,0.17333760261535644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,128,power_law_1.01,0.0674560010433197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,128,power_law_1.01,0.31483519077301025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,128,power_law_1.01,0.19993599653244018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,128,power_law_1.01,0.07279360294342041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,128,power_law_1.01,0.3124671936035156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,128,power_law_1.01,0.25813119411468505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,128,power_law_1.01,0.07504000067710877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,128,power_law_1.2,0.33794560432434084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,128,balanced,0.14893333117167154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,128,power_law_1.01,0.27482879161834717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,128,power_law_1.01,0.3015872001647949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,128,power_law_1.01,0.07500799894332885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,128,power_law_1.2,0.34473600387573244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,128,power_law_1.01,0.08798720240592957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,128,power_law_1.01,0.3349184036254883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,128,power_law_1.01,0.3721920013427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,128,balanced,0.17241066694259644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,128,power_law_1.2,0.24478719234466553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,128,balanced,0.8521973292032877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,128,power_law_1.01,0.0939520001411438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,128,power_law_1.01,0.4655168056488037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,128,power_law_1.01,0.39838080406188964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,128,balanced,1.6184693972269695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,128,power_law_1.2,0.33050880432128904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,128,power_law_1.01,0.09964159727096558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,128,power_law_1.01,0.6458623886108399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,128,power_law_1.01,0.4729856014251709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,128,power_law_1.2,0.35433599948883054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,128,power_law_1.01,0.11230720281600952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,128,power_law_1.01,0.9652095794677734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,128,balanced,0.2308853268623352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,128,power_law_1.01,0.6450751781463623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,128,power_law_1.2,0.3424000024795532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,128,power_law_1.01,1.062342357635498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,128,power_law_1.01,0.7445631980895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,128,power_law_1.01,0.14022400379180908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,128,power_law_1.2,0.368012809753418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,128,power_law_1.01,1.7316608428955078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,128,power_law_1.01,0.973203182220459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,128,power_law_1.2,0.3419903993606567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,128,power_law_1.01,2.335468864440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,128,balanced,0.2792053421338399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,128,power_law_1.01,1.1521984100341798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,128,power_law_1.2,0.34815359115600586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,128,power_law_1.01,0.13633279800415038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,128,power_law_1.01,2.9470144271850587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,128,power_law_1.01,1.7598207473754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,128,power_law_1.2,0.3461440086364746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,128,power_law_1.01,0.18065279722213745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,128,balanced,1.0512479941050212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,128,power_law_1.2,0.3355391979217529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.01,0.22128000259399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,128,power_law_1.01,2.422054481506348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,128,power_law_1.01,5.047878265380859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,128,power_law_1.2,0.3336575984954834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,128,power_law_1.01,4.413228988647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,128,power_law_1.2,0.3197695970535278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,128,power_law_1.01,9.613069152832031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,128,power_law_1.01,0.2835968017578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,128,power_law_1.01,4.698041534423828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,128,power_law_1.2,0.31626238822937014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.01,0.40035200119018555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,128,power_law_1.2,0.31083519458770753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,128,balanced,0.3964266777038574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,128,power_law_1.01,0.502675199508667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,128,power_law_1.01,7.934623718261719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,128,power_law_1.2,0.2629055976867676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.01,0.6737792015075683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,128,power_law_1.2,0.3446784019470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,128,power_law_1.2,0.2041856050491333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,128,power_law_1.01,18.701190185546874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,128,power_law_1.2,0.3284991979598999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,128,power_law_1.01,1.050598430633545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,128,power_law_1.2,0.19660799503326415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,128,power_law_1.2,0.5428287982940674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.01,1.3324159622192382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,128,power_law_1.2,0.14570239782333375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,128,power_law_1.2,0.5593023777008057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,128,balanced,0.505184014638265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,128,power_law_1.2,0.20071039199829102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,128,power_law_1.2,0.7279295921325684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,128,balanced,1.6489013036092122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,128,power_law_1.2,0.1872063994407654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,128,power_law_1.2,1.0712063789367676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,128,power_law_1.01,1.9321151733398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,128,power_law_1.2,0.1976256012916565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,128,power_law_1.2,1.4691264152526855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,128,power_law_1.01,2.985203170776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,128,power_law_1.2,0.1992576003074646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,128,power_law_1.2,2.1448896408081053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,128,balanced,3.3149598439534507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,128,power_law_1.2,0.20222079753875732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,128,power_law_1.01,5.5185791015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,128,power_law_1.2,3.2906368255615233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,128,power_law_1.2,0.20166399478912353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,128,power_law_1.2,4.577004623413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,128,power_law_1.2,0.2020927906036377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,128,power_law_1.2,0.195251202583313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,128,power_law_1.2,6.288870239257813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,128,balanced,0.6345173517862955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,128,power_law_1.2,0.1943743944168091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,128,power_law_1.2,8.640652465820313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,128,power_law_1.2,0.18804479837417604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,128,power_law_1.2,0.19400320053100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,128,power_law_1.2,13.967814636230468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,128,power_law_1.2,0.17875200510025024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,128,power_law_1.2,0.18227839469909668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,128,power_law_1.2,0.20855679512023925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,128,power_law_1.2,35.85335693359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,128,power_law_1.2,0.24652159214019775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,128,power_law_1.2,0.2895103931427002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,128,power_law_1.2,0.3619136095046997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,128,power_law_1.2,0.46561279296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,128,balanced,0.9758826891581217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,128,power_law_1.2,0.6297279834747315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,128,power_law_1.2,0.784287977218628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,128,power_law_1.2,1.1945152282714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,128,balanced,3.278261184692383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,128,power_law_1.2,1.6022207260131835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,128,power_law_1.2,2.353785514831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,128,power_law_1.2,3.7874687194824217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,128,power_law_1.2,4.581401443481445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,128,power_law_1.2,8.582265472412109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,128,power_law_1.2,20.48005065917969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,128,balanced,1.9806079864501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,128,power_law_1.2,0.06120960116386413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,128,power_law_1.2,0.05852159857749939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,128,power_law_1.2,0.05095040202140808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,64,balanced,0.10919466614723206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,128,power_law_1.2,0.06392319798469544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,64,balanced,0.11115200320879619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,128,power_law_1.2,0.06375679969787598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,64,balanced,0.10937066872914632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,64,balanced,0.1146453320980072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,128,power_law_1.2,0.06515200138092041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,64,balanced,0.19875200589497885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,128,power_law_1.2,0.06575359702110291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,64,balanced,0.35837864875793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,128,power_law_1.2,0.06663680076599121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,64,balanced,0.3739573160807292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,128,power_law_1.2,0.06710399985313416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,64,balanced,0.36602667967478436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,128,power_law_1.2,0.06801279783248901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,64,balanced,0.37881600856781006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,128,power_law_1.2,0.07394559979438782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,64,balanced,0.3468746741612752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,64,balanced,0.0764160007238388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,64,balanced,0.39558398723602295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,128,power_law_1.2,0.07570559978485107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,64,balanced,0.0776693324247996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,64,balanced,0.36857601006825763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,128,power_law_1.2,0.0818560004234314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,64,balanced,0.07874666651089986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,64,balanced,0.3899679978688558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,128,power_law_1.2,0.09266560077667237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,64,balanced,0.07970133423805237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,64,balanced,0.35865068435668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,128,power_law_1.2,0.09670400023460388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,64,balanced,0.12388799587885539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,64,power_law_1.01,0.3539072036743164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,64,balanced,0.38114134470621747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,64,balanced,0.21466133991877237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,128,power_law_1.2,0.10370559692382812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,64,power_law_1.01,0.35841920375823977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,64,balanced,0.3622293472290039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,64,balanced,0.21411732832590738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,128,power_law_1.2,0.12527999877929688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,64,power_law_1.01,0.29506559371948243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,64,balanced,0.33243733644485474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,64,balanced,0.21819200118382773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,64,power_law_1.01,0.21072640419006347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,64,balanced,0.043696001172065735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,64,power_law_1.01,0.2381824016571045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,64,balanced,0.21620267629623413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,128,power_law_1.2,0.15720959901809692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,64,balanced,0.37492799758911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,64,power_law_1.01,0.31191039085388184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,64,balanced,0.044309332966804504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,64,balanced,0.2075200080871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,64,power_law_1.01,0.34993278980255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,64,balanced,0.3455040057500203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,64,balanced,0.04422399898370107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,64,balanced,0.2152693271636963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,64,power_law_1.01,0.3687936067581177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,64,balanced,0.04756266872088114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,64,balanced,0.22080000241597494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,128,power_law_1.2,0.15242880582809448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,64,power_law_1.01,0.3600127935409546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,64,balanced,0.33880531787872314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,64,power_law_1.01,0.3657151937484741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,64,balanced,0.05327466626962026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,64,balanced,0.22207466761271158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,128,power_law_1.2,0.22835841178894042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,64,power_law_1.01,0.3470400094985962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,64,balanced,0.0652159998814265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,64,balanced,0.33192533254623413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,64,balanced,0.2066239913304647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.2,0.2937855958938599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,64,power_law_1.01,0.33422720432281494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,64,balanced,0.06628266473611195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,64,balanced,0.22219200929005942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,64,power_law_1.01,0.34150400161743166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,64,balanced,0.06727999945481618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,64,power_law_1.01,0.33024001121520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,64,balanced,0.2227039933204651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,64,balanced,0.30509867270787555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,64,balanced,0.06712000072002411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,64,power_law_1.01,0.35238399505615237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,128,power_law_1.2,0.37160320281982423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,64,balanced,0.21533334255218506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,64,power_law_1.01,0.3074624061584473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,64,balanced,0.06770666440327962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.2,0.5044288158416748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,64,power_law_1.01,0.31432960033416746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,64,balanced,0.2172213395436605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,64,balanced,0.06892266869544983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,64,balanced,0.2592586676279704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,64,power_law_1.01,0.3610559940338135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,128,power_law_1.2,0.650707197189331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,64,balanced,0.06927466889222463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,64,power_law_1.01,0.35900800228118895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,64,power_law_1.01,0.21594879627227784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,64,balanced,0.23414933681488037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.2,1.0020544052124023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,64,balanced,0.07101866602897644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,64,power_law_1.01,0.4548287868499756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,64,power_law_1.01,0.21578240394592285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,64,power_law_1.01,0.5269887924194336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,64,balanced,0.2413706580797831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,64,balanced,0.07171200215816498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,64,balanced,0.5492639938990275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,64,power_law_1.01,0.7291903972625733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,128,power_law_1.2,1.6611520767211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,64,power_law_1.01,0.20838398933410646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,64,balanced,0.07655466596285503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,64,power_law_1.01,0.786790418624878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,64,balanced,0.2502346634864807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,64,power_law_1.01,0.1343616008758545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,64,balanced,0.07858133316040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.2,2.2030399322509764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,64,power_law_1.01,1.1726911544799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,64,power_law_1.01,0.16647679805755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,64,balanced,0.0811359981695811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,64,power_law_1.01,1.3982527732849122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,64,balanced,0.2640906572341919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,64,power_law_1.01,2.1747648239135744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,64,power_law_1.01,0.18336639404296876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,128,power_law_1.2,2.4428863525390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,64,balanced,0.45899732907613117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,64,power_law_1.01,2.711903953552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,64,power_law_1.01,0.1903807997703552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,128,power_law_1.2,4.112390518188477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,64,balanced,0.0925386647383372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,64,power_law_1.01,3.3487934112548827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,64,balanced,0.2695840001106262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,64,power_law_1.01,0.2133375883102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,64,power_law_1.01,0.19197440147399902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,64,power_law_1.01,5.576921463012695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,64,power_law_1.01,0.06340479850769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,128,power_law_1.2,10.327814483642578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,64,power_law_1.01,0.18483200073242187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,64,power_law_1.01,0.060147202014923094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,64,balanced,0.46480000019073486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,64,power_law_1.01,14.447602844238281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,64,power_law_1.01,0.19954559803009034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,64,balanced,0.6594133377075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,64,power_law_1.01,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,64,power_law_1.2,0.35503358840942384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,64,power_law_1.01,0.2039936065673828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,64,power_law_1.01,0.055641597509384154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,64,balanced,0.0990559955437978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,64,power_law_1.01,0.2079103946685791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,64,power_law_1.2,0.3569279909133911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,64,power_law_1.01,0.06304640173912049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,64,power_law_1.01,0.1876863956451416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,64,balanced,0.11440533399581909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,64,power_law_1.2,0.15627520084381102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,64,balanced,0.47520001729329425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,64,power_law_1.01,0.0636352002620697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,64,power_law_1.2,0.24977281093597412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,64,power_law_1.01,0.19377919435501098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,64,power_law_1.01,0.06464639902114869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,64,balanced,0.12651733557383218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,64,power_law_1.2,0.22455039024353027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,64,power_law_1.01,0.20625920295715333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,64,power_law_1.01,0.06805760264396668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,64,balanced,0.8605066935221354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,64,power_law_1.2,0.2803967952728271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,64,power_law_1.01,0.20224640369415284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,64,power_law_1.01,0.06775680184364319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,64,power_law_1.2,0.34603519439697267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,64,power_law_1.01,0.21464319229125978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,64,power_law_1.01,0.06788480281829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,64,balanced,0.681541363398234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,64,power_law_1.01,0.25824000835418703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,64,power_law_1.2,0.35697920322418214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,64,power_law_1.01,0.07215359807014465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,64,power_law_1.01,0.07365760207176208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,64,power_law_1.01,0.3219199895858765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,64,power_law_1.2,0.34065918922424315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,64,balanced,0.15904532869656882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,64,power_law_1.01,0.07730559706687927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,64,power_law_1.01,0.3441728115081787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,64,power_law_1.2,0.35243520736694334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,64,power_law_1.01,0.0819263994693756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,64,power_law_1.2,0.3576767921447754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,64,power_law_1.01,0.4705023765563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,64,balanced,0.18458133935928345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,64,power_law_1.01,0.09152640104293823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,64,power_law_1.2,0.34717440605163574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,64,power_law_1.01,0.5600512027740479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,64,power_law_1.01,0.09648000001907349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,64,balanced,1.0766773223876953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,64,power_law_1.01,0.6917376041412353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,64,power_law_1.2,0.3527744054794312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,64,balanced,0.8866133689880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,64,power_law_1.01,0.10444159507751465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,64,power_law_1.01,0.9367487907409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,64,power_law_1.2,0.3152575969696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,64,balanced,0.2510400017102559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,64,power_law_1.2,0.3181632041931152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,64,power_law_1.01,0.1287935972213745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,64,power_law_1.01,1.426969623565674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,64,power_law_1.2,0.29073920249938967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,64,power_law_1.01,1.7472000122070312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,64,power_law_1.2,0.3336704015731812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,64,power_law_1.01,0.1298815965652466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,64,balanced,0.3044640024503072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,64,power_law_1.01,2.436128044128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,64,power_law_1.2,0.40192642211914065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,64,power_law_1.01,0.17239680290222167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,64,power_law_1.01,4.013977432250977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,64,power_law_1.01,0.20980479717254638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,64,power_law_1.2,0.4171135902404785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,64,balanced,1.0948320229848225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,64,power_law_1.2,0.5655871868133545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,64,power_law_1.01,8.167993927001953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,64,power_law_1.01,0.2566335916519165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,64,power_law_1.2,0.7293695926666259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,64,power_law_1.01,0.34907519817352295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,64,power_law_1.2,0.8784192085266114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,64,balanced,1.701456069946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,64,power_law_1.01,0.492083215713501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,64,balanced,0.4420479933420817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,64,power_law_1.2,1.0586048126220704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,64,power_law_1.01,0.6241087913513184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,64,power_law_1.2,1.2968832015991212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,64,power_law_1.2,1.8849472045898437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,64,power_law_1.01,0.9906880378723144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,64,power_law_1.2,2.9065664291381834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,64,power_law_1.01,1.4146623611450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,64,power_law_1.2,4.474278259277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,64,balanced,0.5726720094680786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,64,power_law_1.2,4.489939117431641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,64,balanced,1.7161919275919597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,64,power_law_1.01,1.5812416076660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,64,power_law_1.2,10.292460632324218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,64,power_law_1.01,2.3982656478881834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,64,power_law_1.01,5.191296005249024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,64,power_law_1.2,22.90142059326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,64,balanced,0.7263946533203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,64,balanced,3.502810796101888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,64,balanced,1.1107093493143718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,64,balanced,3.407461484273275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,64,power_law_1.2,0.21548800468444823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,64,power_law_1.2,0.21751680374145507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,64,power_law_1.2,0.12539520263671874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,64,power_law_1.2,0.1417088031768799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,64,power_law_1.2,0.14163199663162232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,64,power_law_1.2,0.18880640268325805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,64,power_law_1.2,0.06380800008773804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,64,power_law_1.2,0.2075648069381714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,64,power_law_1.2,0.2120448112487793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,64,power_law_1.2,0.06032639741897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,64,power_law_1.2,0.1861631989479065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,64,power_law_1.2,0.048895999789237976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,64,power_law_1.2,0.19328000545501708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,64,power_law_1.2,0.2004863977432251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,64,power_law_1.2,0.05921279788017273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,64,power_law_1.2,0.19678720235824584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,64,power_law_1.2,0.059987199306488034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,64,power_law_1.2,0.20249600410461427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,64,balanced,2.2218453089396157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,64,power_law_1.2,0.18839679956436156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,64,power_law_1.2,0.059910398721694944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,64,power_law_1.2,0.18747520446777344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,64,power_law_1.2,0.06612480282783509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,64,power_law_1.2,0.20325760841369628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,64,power_law_1.2,0.1890176057815552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,64,power_law_1.2,0.06479359865188598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,64,power_law_1.2,0.2302783966064453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,64,power_law_1.2,0.06632959842681885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,64,power_law_1.2,0.2756160020828247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,64,power_law_1.2,0.06704000234603882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,64,power_law_1.2,0.3432255983352661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,64,power_law_1.2,0.43364481925964354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,64,power_law_1.2,0.07146239876747132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,64,power_law_1.2,0.5400703907012939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,64,power_law_1.2,0.07451519966125489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,64,power_law_1.2,0.7124864101409912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,64,power_law_1.2,0.07845759987831116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,64,power_law_1.2,1.006873607635498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,64,power_law_1.2,1.3051839828491212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,64,power_law_1.2,0.08370559811592101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,64,power_law_1.2,1.987424087524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,64,power_law_1.2,0.09537280201911927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,64,power_law_1.2,2.84399356842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,64,power_law_1.2,0.09538559913635254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,64,power_law_1.2,3.5864959716796876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,64,power_law_1.2,0.11890560388565063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,64,power_law_1.2,5.853612899780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,64,power_law_1.2,0.1371008038520813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,64,power_law_1.2,13.543878173828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,64,power_law_1.2,0.1515712022781372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,64,power_law_1.2,0.19459840059280395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,32,balanced,0.05606399973233541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,64,power_law_1.2,0.2380671977996826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,32,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,32,balanced,0.05535466472307841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,32,balanced,0.062208001812299095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,64,power_law_1.2,0.32766079902648926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,32,balanced,0.06982933481534322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,32,balanced,0.08717866738637288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,64,power_law_1.2,0.4289535999298096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,32,balanced,0.08789867162704468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,64,power_law_1.2,0.6436672210693359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,32,balanced,0.08898133039474487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,64,power_law_1.2,0.8600640296936035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,32,balanced,0.08953600128491719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,32,balanced,0.08981866637865703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,64,power_law_1.2,1.4207039833068849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,32,balanced,0.09067199627558391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,64,power_law_1.2,1.7514047622680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,32,balanced,0.0920799970626831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,32,balanced,0.092031995455424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,64,power_law_1.2,2.0449024200439454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,32,balanced,0.0953653355439504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,32,balanced,0.09879466891288757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,64,power_law_1.2,4.284844970703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,32,balanced,0.10225600004196167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,32,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,64,power_law_1.2,7.476633453369141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,32,balanced,0.10272533694903056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,32,balanced,0.048437332113583885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,32,balanced,0.04769066472848257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,32,balanced,0.10951466361681621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,32,balanced,0.0517546683549881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,32,balanced,0.11644267042477925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,32,balanced,0.0543093333641688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,32,balanced,0.06852266689141591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,32,balanced,0.13050666451454163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,32,balanced,0.043893332282702126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,32,balanced,0.07089599967002869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,32,balanced,0.04481600224971771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,32,balanced,0.07154133419195811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,32,balanced,0.14826666315396628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,32,balanced,0.04444266855716705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,32,balanced,0.0724533349275589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,32,balanced,0.04854399959246317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,32,balanced,0.07298133273919423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,32,balanced,0.16685332854588827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,32,balanced,0.05303466816743215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,32,balanced,0.07445333401362102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,32,balanced,0.06736533343791962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,32,balanced,0.07541866600513458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,32,balanced,0.19182932376861572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,32,balanced,0.06911999980608623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,32,balanced,0.07718933125336964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,32,power_law_1.01,0.10637439489364624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,32,balanced,0.06989333530267079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,32,balanced,0.07876266539096832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,32,balanced,0.07020266850789388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,32,power_law_1.01,0.0833791971206665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,32,balanced,0.08387200037638347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,32,balanced,0.2556106646855672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,32,balanced,0.0708000014225642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,32,balanced,0.08568533261617024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,32,power_law_1.01,0.08246399760246277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,32,balanced,0.07197866837183635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,32,balanced,0.08994666735331218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,32,power_law_1.01,0.06732800006866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,32,balanced,0.07301866511503856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,32,balanced,0.10045866171518962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,32,power_law_1.01,0.06896640062332153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,32,balanced,0.0745600014925003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,32,power_law_1.01,0.06966400146484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,32,balanced,0.3099466760953267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,32,balanced,0.1111893355846405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,32,power_law_1.01,0.07640320062637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,32,balanced,0.07530666887760162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,32,power_law_1.01,0.06570879817008972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,32,balanced,0.08054399987061818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,32,power_law_1.01,0.0810368001461029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,32,balanced,0.1320373316605886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,32,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,32,balanced,0.08250666658083598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,32,power_law_1.01,0.08327680230140685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,32,balanced,0.1495413382848104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,32,balanced,0.08571733037630717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,32,power_law_1.01,0.05749760270118713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,32,power_law_1.01,0.08590720295906067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,32,power_law_1.01,0.05978239774703979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,32,power_law_1.01,0.08398720026016235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,32,balanced,0.40456533432006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,32,balanced,0.18819733460744223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,32,power_law_1.01,0.06424319744110107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,32,balanced,0.09728533029556274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,32,power_law_1.01,0.08712319731712341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,32,power_law_1.01,0.06418560147285461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,32,power_law_1.01,0.09098880290985108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,32,power_law_1.01,0.0670527994632721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,32,balanced,0.22261865933736166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,32,power_law_1.01,0.09115520119667053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,32,power_law_1.01,0.06919040083885193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,32,power_law_1.01,0.09795839786529541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,32,power_law_1.01,0.07022719979286193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,32,balanced,0.10679466525713603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,32,power_law_1.01,0.10976639986038209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,32,balanced,0.301749328772227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,32,power_law_1.01,0.07200000286102295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,32,power_law_1.01,0.1098688006401062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,32,balanced,0.126309335231781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,32,balanced,0.5326773325602213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,32,power_law_1.01,0.0719488024711609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,32,power_law_1.01,0.11038719415664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,32,power_law_1.01,0.07607679963111877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,32,balanced,0.13900267084439596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,32,power_law_1.01,0.07958400249481201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,32,power_law_1.01,0.13583359718322754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,32,balanced,0.38121068477630615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,32,power_law_1.01,0.08812159895896912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,32,power_law_1.01,0.14332159757614135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,32,power_law_1.01,0.0918079972267151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,32,power_law_1.01,0.0989247977733612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,32,power_law_1.01,0.17575039863586425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,32,power_law_1.01,0.11832959651947021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,32,power_law_1.01,0.19312000274658203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,32,balanced,0.17866132656733194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,32,power_law_1.01,0.1198848009109497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,32,power_law_1.01,0.2490367889404297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,32,power_law_1.01,0.1620800018310547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,32,balanced,0.5276639858881632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,32,balanced,0.663263996442159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,32,power_law_1.01,0.18464640378952027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,32,power_law_1.01,0.28419198989868166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,32,balanced,0.20836265881856283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,32,power_law_1.01,0.23161599636077881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,32,power_law_1.01,0.3714240074157715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,32,power_law_1.01,0.28072960376739503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,32,power_law_1.01,0.07069439888000488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,32,power_law_1.01,0.4609792232513428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,32,power_law_1.01,0.38696320056915284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,32,balanced,0.2935413320859273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,32,power_law_1.01,0.652998399734497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,32,power_law_1.01,0.06433280110359192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,32,power_law_1.01,0.49754881858825684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,32,power_law_1.01,0.055871999263763426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,32,power_law_1.01,0.9133248329162598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,32,power_law_1.01,0.6809599876403809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,32,balanced,0.6762986977895101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,32,power_law_1.01,0.05447040200233459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,32,power_law_1.01,0.9330240249633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,32,power_law_1.01,1.0773823738098145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,32,balanced,0.370138684908549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,32,power_law_1.01,0.06036480069160462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,32,power_law_1.01,1.1574975967407226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,32,power_law_1.01,1.6182655334472655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,32,power_law_1.01,0.062118399143219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,32,power_law_1.01,1.7279167175292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,32,power_law_1.01,0.06669440269470214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,32,power_law_1.01,3.196121597290039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,32,power_law_1.01,0.06792960166931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,32,power_law_1.01,3.848223876953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,32,power_law_1.01,0.06858239769935608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,32,balanced,0.9264106750488281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,32,power_law_1.01,0.0697920024394989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,32,power_law_1.2,0.10766719579696656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,32,power_law_1.01,0.07141119837760926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,32,balanced,0.8509120146433512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,32,power_law_1.2,0.08327040076255798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,32,power_law_1.01,0.07626240253448487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,32,power_law_1.2,0.07029119729995728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,32,balanced,0.5517760117848715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,32,power_law_1.01,0.07588480114936828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,32,power_law_1.2,0.066048002243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,32,power_law_1.01,0.08206719756126404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,32,power_law_1.2,0.06967679858207702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,32,power_law_1.01,0.09132159948348999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,32,power_law_1.2,0.0722495973110199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,32,power_law_1.01,0.09959040284156799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,32,power_law_1.2,0.08018559813499451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,32,power_law_1.01,0.10902400016784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,32,power_law_1.2,0.08334720134735107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,32,balanced,0.7108159859975179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,32,power_law_1.2,0.08436480164527893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,32,power_law_1.01,0.12144639492034912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,32,power_law_1.2,0.08674560189247131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,32,power_law_1.2,0.08797439932823181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,32,power_law_1.2,0.0883903980255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,32,power_law_1.01,0.1356927990913391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,32,power_law_1.2,0.08934400081634522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,32,balanced,1.3034613132476807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,32,power_law_1.01,0.16792960166931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,32,power_law_1.2,0.09218559861183166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,32,power_law_1.2,0.1137279987335205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,32,power_law_1.01,0.21111679077148438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,32,power_law_1.2,0.12471679449081421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,32,power_law_1.2,0.12113920450210572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,32,power_law_1.01,0.2858112096786499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,32,power_law_1.2,0.1472000002861023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,32,power_law_1.01,0.3780927896499634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,32,power_law_1.2,0.14988800287246704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,32,balanced,0.8889973163604736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,32,power_law_1.01,0.500051212310791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,32,power_law_1.2,0.1868224024772644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,32,power_law_1.2,0.06874880194664001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,32,power_law_1.01,0.6450560092926025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,32,power_law_1.2,0.20764799118041993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,32,power_law_1.2,0.061977601051330565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,32,balanced,1.8301706314086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,32,power_law_1.2,0.05418879985809326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,32,power_law_1.2,0.2636735916137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,32,power_law_1.2,0.05671679973602295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,32,power_law_1.2,0.3245311975479126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,32,power_law_1.01,0.9511679649353028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,32,power_law_1.2,0.05658239722251892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,32,power_law_1.2,0.4376704216003418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,32,power_law_1.01,1.1798080444335937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,32,power_law_1.2,0.06199679970741272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,32,power_law_1.2,0.5465727806091308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,32,power_law_1.2,0.06602879762649536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,32,power_law_1.2,0.7611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,32,power_law_1.01,1.6761663436889649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,32,power_law_1.2,0.06872320175170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,32,power_law_1.2,1.087936019897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,32,power_law_1.2,0.0683135986328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,32,power_law_1.01,2.67578239440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,32,power_law_1.2,1.2628607749938965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,32,power_law_1.2,0.07167360186576843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,32,balanced,1.3698612848917644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,32,power_law_1.01,4.951129531860351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,32,power_law_1.2,0.0735871970653534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,32,power_law_1.2,2.612486457824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,32,power_law_1.2,0.07440639734268188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,32,power_law_1.2,4.610521697998047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,32,power_law_1.2,0.07887359857559204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,32,power_law_1.2,0.07978240251541138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,32,power_law_1.2,0.09088000059127807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,32,balanced,2.547327995300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,32,power_law_1.2,0.09639040231704712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,32,power_law_1.2,0.09997439980506898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,32,power_law_1.2,0.1235967993736267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,32,power_law_1.2,0.1398975968360901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,32,power_law_1.2,0.1619647979736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,32,power_law_1.2,0.2007807970046997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,32,power_law_1.2,0.2645632028579712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,32,power_law_1.2,0.3188159942626953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,32,power_law_1.2,0.42946557998657225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,32,power_law_1.2,0.5495423793792724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,32,power_law_1.2,0.7808383941650391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,32,power_law_1.2,1.1397952079772948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,32,power_law_1.2,1.3942463874816895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,32,power_law_1.2,2.2453567504882814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,32,power_law_1.2,4.769068908691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,32,balanced,2.7286399205525718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,16,balanced,0.054842665791511536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,16,balanced,0.055045331517855324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,32,power_law_1.2,0.07057279944419861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,16,balanced,0.05539733171463013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,32,power_law_1.2,0.06467199921607972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,16,balanced,0.061797335743904114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,16,balanced,0.0710346649090449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,32,power_law_1.2,0.04984320104122162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,16,balanced,0.0885653297106425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,32,power_law_1.2,0.05491200089454651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,16,balanced,0.0897173285484314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,32,power_law_1.2,0.057740801572799684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,16,balanced,0.09125333031018575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,32,power_law_1.2,0.06247040033340454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,16,balanced,0.09098666906356812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,32,power_law_1.2,0.06589440107345582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,16,balanced,0.09134933352470398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,32,power_law_1.2,0.0667136013507843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,16,balanced,0.09276266892751057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,16,balanced,0.0939520001411438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,32,power_law_1.2,0.0671231985092163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,16,balanced,0.09422399600346883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,32,power_law_1.2,0.06845440268516541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,16,balanced,0.09644800424575806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,32,power_law_1.2,0.07063040137290955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,16,balanced,0.10095466176668803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,32,power_law_1.2,0.07417600154876709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,16,balanced,0.10141866405804952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,32,power_law_1.2,0.07893120050430298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,32,power_law_1.2,0.08210560083389282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,16,balanced,0.10564266641934712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,32,power_law_1.2,0.0986240029335022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,16,balanced,0.11400533715883891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,32,power_law_1.2,0.10483839511871337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,16,balanced,0.12592533230781555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,32,power_law_1.2,0.1095039963722229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,16,balanced,0.1431893308957418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,32,power_law_1.2,0.14788479804992677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,16,balanced,0.1539520025253296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,32,power_law_1.2,0.1412287950515747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,16,balanced,0.18922666708628336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,16,balanced,0.047151997685432434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,32,power_law_1.2,0.19258879423141478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,16,balanced,0.04794133206208547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,32,power_law_1.2,0.2282815933227539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,16,balanced,0.2131999929745992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,16,balanced,0.047877331574757896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,16,balanced,0.05282666782538096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,32,power_law_1.2,0.3361088037490845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,16,balanced,0.05691733459631602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,16,balanced,0.07253866891066234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,16,balanced,0.283786674340566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,32,power_law_1.2,0.4179520130157471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,16,balanced,0.07412800192832947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,32,power_law_1.2,0.6242303848266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,16,balanced,0.07445333401362102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,32,power_law_1.2,0.8634176254272461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,16,balanced,0.07515199979146321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,16,balanced,0.07600533465544383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,16,balanced,0.35020267963409424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,16,balanced,0.07725866635640462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,32,power_law_1.2,1.2817472457885741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,16,balanced,0.07796800136566162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,16,balanced,0.04478933413823446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,16,balanced,0.07967466612656911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,32,power_law_1.2,1.6794303894042968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,16,balanced,0.08213866750399272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,16,balanced,0.04543466866016388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,16,balanced,0.0466186652580897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,16,balanced,0.08649599552154541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,16,power_law_1.01,0.07757440209388733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,32,power_law_1.2,2.3074880599975587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,16,power_law_1.01,0.06575999855995178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,16,balanced,0.0517493337392807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,16,balanced,0.4684160153071086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,16,balanced,0.0897653301556905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,16,power_law_1.01,0.09376000165939331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,16,balanced,0.05834666887919108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,16,power_law_1.01,0.06815360188484192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,16,power_law_1.01,0.06847360134124755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,32,power_law_1.2,3.9178497314453127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,16,balanced,0.0937493344148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,16,balanced,0.07215466598669688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,16,power_law_1.01,0.06643199920654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,16,power_law_1.01,0.05422080159187317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,16,balanced,0.07460266848405202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,16,power_law_1.01,0.06874880194664001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,16,balanced,0.10746133327484131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,16,balanced,0.07481599847475688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,32,power_law_1.2,7.078092956542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,16,power_law_1.01,0.07220479846000671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,16,power_law_1.01,0.05626239776611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,16,power_law_1.01,0.07976959943771363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,16,balanced,0.07579199969768524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,16,balanced,0.12104533116022746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,16,power_law_1.01,0.05863040089607239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,16,power_law_1.01,0.08309119939804077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,16,balanced,0.0758240024248759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,16,power_law_1.01,0.08511360287666321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,16,balanced,0.14136000474294028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,16,power_law_1.01,0.06280959844589233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,16,balanced,0.07826133569081624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,16,power_law_1.01,0.08568959832191467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,16,balanced,0.0795413355032603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,16,power_law_1.01,0.06893439888954163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,16,balanced,0.6118880112965902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,16,power_law_1.01,0.08857600092887878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,16,balanced,0.16244266430536905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,16,power_law_1.01,0.09071999788284302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,16,balanced,0.08144533137480418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,16,power_law_1.01,0.06928640007972717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,16,power_law_1.01,0.09268479943275451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,16,balanced,0.08255999783674876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,16,power_law_1.01,0.09972479939460754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,16,power_law_1.01,0.07038080096244811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,16,balanced,0.20266133546829224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,16,power_law_1.01,0.10373120307922364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,16,balanced,0.08949866890907288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,16,power_law_1.01,0.07111039757728577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,16,power_law_1.01,0.11304960250854493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,16,balanced,0.09169066945711772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,16,power_law_1.01,0.11365760564804077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,16,power_law_1.01,0.07431679964065552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,16,balanced,0.09572266538937886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,16,power_law_1.01,0.12769919633865356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,16,balanced,0.24553066492080688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,16,power_law_1.01,0.07584000229835511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,16,power_law_1.01,0.14281599521636962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,16,power_law_1.01,0.07985919713973999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,16,power_law_1.01,0.16376320123672486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,16,power_law_1.01,0.202508807182312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,16,power_law_1.01,0.08487039804458618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,16,balanced,0.11376532912254333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,16,balanced,0.782591978708903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,16,power_law_1.01,0.23916800022125245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,16,power_law_1.01,0.0908415973186493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,16,balanced,0.3283413251241048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,16,power_law_1.01,0.29553918838500975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,16,power_law_1.01,0.09852160215377807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,16,power_law_1.01,0.3596224069595337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,16,power_law_1.01,0.10371840000152588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,16,power_law_1.01,0.4961343765258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,16,power_law_1.01,0.11793919801712036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,16,power_law_1.01,0.6401343822479248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,16,balanced,0.12796800335248312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,16,power_law_1.01,0.13842560052871705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,16,power_law_1.01,0.9148544311523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,16,power_law_1.2,0.0791808009147644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,16,balanced,0.4247200091679891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,16,power_law_1.01,1.046444797515869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,16,power_law_1.01,0.16789120435714722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,16,balanced,0.15389866630236307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,16,power_law_1.2,0.0883903980255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,16,power_law_1.01,1.6079999923706054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,16,power_law_1.01,0.19286400079727173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,16,power_law_1.2,0.06096640229225159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,16,balanced,0.16830400625864664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,16,power_law_1.01,3.577996826171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,16,power_law_1.01,0.2517632007598877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,16,power_law_1.2,0.06379520297050476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,16,power_law_1.01,0.06185600161552429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,16,power_law_1.01,0.3104703903198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,16,power_law_1.2,0.06836479902267456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,16,power_law_1.01,0.07429119944572449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,16,power_law_1.01,0.40039677619934083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,16,balanced,0.5970453421274821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,16,power_law_1.2,0.07226240038871765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,16,power_law_1.01,0.05345919728279114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,16,balanced,0.22860799233118692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,16,power_law_1.01,0.5158336162567139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,16,power_law_1.2,0.07938560247421264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,16,power_law_1.01,0.056601601839065555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,16,power_law_1.2,0.08257920145988465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,16,power_law_1.01,0.7626880168914795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,16,balanced,1.1291840076446533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,16,power_law_1.01,0.06099200248718262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,16,balanced,0.2797226707140605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,16,power_law_1.2,0.08416640162467956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,16,power_law_1.01,0.9889087677001953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,16,power_law_1.01,0.06683520078659058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,16,power_law_1.2,0.08440960049629212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,16,power_law_1.01,1.2196928024291993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,16,power_law_1.01,0.06980479955673217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,16,power_law_1.2,0.08804479837417603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,16,power_law_1.01,0.07324159741401673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,16,balanced,0.41839468479156494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,16,power_law_1.01,1.911814308166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,16,power_law_1.2,0.0900160014629364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,16,balanced,0.7736586729685465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,16,power_law_1.01,0.07490559816360473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,16,power_law_1.2,0.0946175992488861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,16,power_law_1.01,3.9372161865234374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,16,power_law_1.01,0.07496960163116455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,16,power_law_1.2,0.09528959989547729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,16,power_law_1.2,0.10680320262908935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,16,power_law_1.01,0.0815936028957367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,16,balanced,0.5188639958699545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,16,power_law_1.2,0.11665920019149781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,16,power_law_1.01,0.08349440097808838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,16,power_law_1.2,0.11627520322799682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,16,power_law_1.01,0.08501120209693909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,16,power_law_1.2,0.1334272027015686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,16,power_law_1.01,0.09155200123786926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,16,power_law_1.2,0.14659839868545532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,16,power_law_1.01,0.09889919757843017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,16,balanced,0.9794027010599772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,16,power_law_1.2,0.183513605594635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,16,power_law_1.01,0.10280959606170655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,16,power_law_1.2,0.20814719200134277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,16,power_law_1.01,0.12208000421524048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,16,power_law_1.2,0.26124160289764403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,16,balanced,0.7533760070800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,16,power_law_1.01,0.1384511947631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,16,power_law_1.2,0.3104896068572998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,16,power_law_1.2,0.42441601753234864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,16,power_law_1.01,0.16110080480575562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,16,power_law_1.2,0.5478911876678467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,16,power_law_1.01,0.20604159832000732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,16,power_law_1.2,0.8080896377563477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,16,power_law_1.01,0.2732928037643433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,16,power_law_1.2,1.0784128189086915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,16,power_law_1.2,1.3465087890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,16,balanced,0.9710666338602701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,16,power_law_1.01,0.350272011756897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,16,power_law_1.2,2.0641984939575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,16,power_law_1.01,0.43230719566345216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,16,balanced,2.1599413553873696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,16,power_law_1.01,0.5741055965423584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,16,balanced,1.4567039807637532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,16,power_law_1.2,4.499596786499024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,16,power_law_1.01,0.7845759868621827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,16,power_law_1.01,1.1960384368896484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,16,power_law_1.01,1.5492159843444824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,16,balanced,1.2090400060017903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,16,power_law_1.01,2.044576072692871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,16,power_law_1.01,2.9106943130493166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,16,power_law_1.01,6.464832305908203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,16,balanced,1.8819093704223633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,16,power_law_1.2,0.06235520243644714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,16,power_law_1.2,0.06833919882774353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,16,power_law_1.2,0.05196800231933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,16,balanced,2.8692906697591147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,16,power_law_1.2,0.05597440004348755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,16,power_law_1.2,0.05809919834136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,16,power_law_1.2,0.062009602785110474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,16,power_law_1.2,0.06637439727783204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,16,power_law_1.2,0.06780160069465638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,16,power_law_1.2,0.0716480016708374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,16,power_law_1.2,0.07097600102424621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,16,power_law_1.2,0.07352960109710693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,16,power_law_1.2,0.07772160172462464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,16,power_law_1.2,0.0808896005153656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,16,power_law_1.2,0.08513919711112976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,16,power_law_1.2,0.0936191976070404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,16,power_law_1.2,0.09895039796829223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,16,power_law_1.2,0.10292479991912842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,16,power_law_1.2,0.12153600454330445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,16,power_law_1.2,0.14243839979171752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,16,power_law_1.2,0.17793279886245728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,16,power_law_1.2,0.06092159748077393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,16,balanced,3.746005376180013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,16,power_law_1.2,0.2079103946685791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,16,power_law_1.2,0.07081599831581116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,16,power_law_1.2,0.2696448087692261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,16,power_law_1.2,0.04874880015850067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,16,power_law_1.2,0.33056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,16,power_law_1.2,0.05617280006408691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,16,power_law_1.2,0.06087039709091187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,16,power_law_1.2,0.47251200675964355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,16,power_law_1.2,0.06563839912414551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,16,power_law_1.2,0.5343616008758545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,16,power_law_1.2,0.07032960057258605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,16,power_law_1.2,0.07354239821434021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,16,power_law_1.2,0.8860032081604003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,16,power_law_1.2,0.07463039755821228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,16,power_law_1.2,1.230131244659424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,16,power_law_1.2,0.07561600208282471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,16,power_law_1.2,0.07984640002250672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,16,power_law_1.2,1.3470272064208983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,16,power_law_1.2,0.08451200127601624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,16,power_law_1.2,0.08694400191307068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,16,power_law_1.2,2.201081657409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,16,power_law_1.2,0.09568639993667602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,16,power_law_1.2,0.10533119440078735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,16,power_law_1.2,5.0870208740234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,16,power_law_1.2,0.11455359458923339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,16,power_law_1.2,0.126310396194458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,8,balanced,0.0551093320051829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,8,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,16,power_law_1.2,0.15199359655380248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,8,balanced,0.056330665946006775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,8,balanced,0.07340266803900401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,16,power_law_1.2,0.15941760540008545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,8,balanced,0.07478933533032735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,16,power_law_1.2,0.21033599376678466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,8,balanced,0.09621333082516988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,16,power_law_1.2,0.31772799491882325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,8,balanced,0.09708266456921895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,16,power_law_1.2,0.4174335956573486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,8,balanced,0.09807999928792317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,16,power_law_1.2,0.5423999786376953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,8,balanced,0.0974720021088918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,16,power_law_1.2,0.7564479827880859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,8,balanced,0.0993226667245229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,16,power_law_1.2,1.1342016220092774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,8,balanced,0.09995733698209126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,8,balanced,0.10139200091362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,16,power_law_1.2,1.4465215682983399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,8,balanced,0.10177600383758545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,16,power_law_1.2,1.9637823104858398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,8,balanced,0.04769066472848257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,8,balanced,0.10448533296585083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,16,power_law_1.2,2.5698944091796876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,8,balanced,0.04846400022506714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,8,balanced,0.11129599809646606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,8,balanced,0.049285332361857094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,16,power_law_1.2,4.111072158813476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,8,balanced,0.11373866597811381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,8,balanced,0.05515199899673462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,8,balanced,0.11640533804893494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,16,power_law_1.2,8.377536010742187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,8,balanced,0.06294399996598561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,8,balanced,0.1293653349081675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,8,balanced,0.08124800026416779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,8,balanced,0.04730666677157084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,8,balanced,0.08237333099047343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,8,balanced,0.05053333441416422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,8,balanced,0.1479200025399526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,8,balanced,0.08277866741021474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,8,balanced,0.052426666021347046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,8,balanced,0.08387733499209087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,8,balanced,0.16014400124549866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,8,balanced,0.05946666498978933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,8,balanced,0.08418132861455281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,8,balanced,0.06674133241176605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,8,balanced,0.1793173352877299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,8,balanced,0.08556266625722249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,8,balanced,0.08523199955622356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,8,balanced,0.08718400200208028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,8,balanced,0.087909330924352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,8,balanced,0.2165279984474182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,8,balanced,0.08884800473848979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,8,power_law_1.01,0.0605567991733551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,8,balanced,0.08958933750788371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,8,balanced,0.09021332859992981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,8,power_law_1.01,0.07522559762001038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,8,balanced,0.08999466896057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,8,balanced,0.09761599699656169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,8,balanced,0.2580746610959371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,8,power_law_1.01,0.06224640011787415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,8,balanced,0.09110933542251587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,8,balanced,0.10054399569829305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,8,power_law_1.01,0.06963840126991272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,8,balanced,0.09259733557701111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,8,balanced,0.10630933443705241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,8,power_law_1.01,0.06918399930000305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,8,balanced,0.09573333462079366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,8,balanced,0.3510400056838989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,8,balanced,0.12077333529790242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,8,power_law_1.01,0.0743552029132843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,8,balanced,0.09851732850074768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,8,power_law_1.01,0.08485760092735291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,8,balanced,0.13640532890955606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,8,balanced,0.10151466727256775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,8,power_law_1.01,0.08616960048675537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,8,balanced,0.10962667067845662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,8,balanced,0.16038933396339417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,8,power_law_1.01,0.08922240138053894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,8,balanced,0.1125973363717397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,8,balanced,0.44434134165445965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,8,power_law_1.01,0.08883839845657349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,8,balanced,0.18425599733988443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,8,balanced,0.11899200081825256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,8,power_law_1.01,0.09191039800643921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,8,power_law_1.01,0.09642239809036254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,8,balanced,0.23879466454188028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,8,balanced,0.14269333084424338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,8,power_law_1.01,0.10013439655303955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,8,power_law_1.01,0.10982400178909302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,8,balanced,0.6183626651763916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,8,power_law_1.01,0.05260800123214722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,8,balanced,0.29316266377766925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,8,power_law_1.01,0.11336959600448608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,8,power_law_1.01,0.06293759942054748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,8,power_law_1.01,0.1214400053024292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,8,power_law_1.01,0.05053439736366272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,8,balanced,0.16614400347073874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,8,power_law_1.01,0.12309119701385499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,8,balanced,0.40537599722544354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,8,power_law_1.01,0.05564799904823303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,8,power_law_1.01,0.14304640293121337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,8,balanced,0.20859734217325845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,8,power_law_1.01,0.06229119896888733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,8,power_law_1.01,0.1542080044746399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,8,power_law_1.01,0.06544640064239501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,8,balanced,0.2424266735712687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,8,power_law_1.01,0.20107519626617432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,8,power_law_1.01,0.0723136007785797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,8,balanced,0.7899839878082275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,8,balanced,0.5176000197728475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,8,power_law_1.01,0.07439360022544861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,8,power_law_1.01,0.21335039138793946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,8,power_law_1.01,0.07687039971351624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,8,power_law_1.01,0.2731712102890015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,8,power_law_1.01,0.07633280158042907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,8,balanced,0.35097599029541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,8,power_law_1.01,0.312940788269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,8,power_law_1.01,0.08106240034103393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,8,power_law_1.01,0.43686399459838865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,8,power_law_1.01,0.08449280261993408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,8,balanced,0.42186133066813153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,8,power_law_1.01,0.08741120100021363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,8,power_law_1.01,0.525932788848877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,8,balanced,0.7385066350301107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,8,power_law_1.01,0.09350399971008301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,8,power_law_1.01,0.9159040451049805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,8,power_law_1.01,0.10126080513000488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,8,balanced,0.6254666646321615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,8,balanced,1.0155839920043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,8,power_law_1.01,0.1048192024230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,8,power_law_1.01,1.0353280067443849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,8,power_law_1.01,0.11218559741973877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,8,power_law_1.01,1.2878656387329102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,8,power_law_1.01,0.13575040102005004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,8,power_law_1.01,1.8008319854736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,8,power_law_1.01,0.1453760027885437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,8,balanced,0.7745599746704102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,8,power_law_1.01,0.17757439613342285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,8,balanced,0.9450613657633463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,8,power_law_1.01,3.7379840850830077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,8,power_law_1.01,0.21616001129150392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,8,power_law_1.01,0.2790911912918091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,8,power_law_1.01,0.33654398918151857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,8,power_law_1.01,0.06094719767570496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,8,power_law_1.01,0.4781951904296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,8,balanced,1.1390399932861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,8,power_law_1.01,0.06891520023345947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,8,power_law_1.01,0.6459648132324218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,8,power_law_1.01,0.05674239993095398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,8,power_law_1.01,0.9007231712341308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,8,power_law_1.01,0.06176000237464905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,8,power_law_1.01,1.116851234436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,8,balanced,1.4723626772562664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,8,power_law_1.01,0.0671999990940094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,8,balanced,1.2073547045389812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,8,power_law_1.2,0.06107519865036011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,8,power_law_1.01,1.4458111763000487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,8,power_law_1.01,0.07585920095443725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,8,power_law_1.01,2.1158527374267577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,8,power_law_1.01,0.0824512004852295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,8,power_law_1.2,0.0746944010257721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,8,balanced,1.4875893592834473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,8,power_law_1.2,0.05686399936676025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,8,power_law_1.01,0.08446080088615418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,8,power_law_1.01,4.443750381469727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,8,power_law_1.2,0.07242239713668823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,8,power_law_1.01,0.08479999899864196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,8,power_law_1.01,0.08828799724578858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,8,power_law_1.2,0.06858879923820496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,8,power_law_1.01,0.0908415973186493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,8,power_law_1.2,0.07390080094337463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,8,power_law_1.01,0.10081919431686401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,8,power_law_1.01,0.10278400182723998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,8,power_law_1.2,0.08169599771499633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,8,power_law_1.01,0.10586240291595458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,8,balanced,1.8522666295369465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,8,power_law_1.2,0.08556159734725952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,8,power_law_1.01,0.12212480306625366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,8,power_law_1.2,0.08921599984169007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,8,power_law_1.2,0.09005439877510071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,8,power_law_1.01,0.1273344039916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,8,balanced,1.7960160573323567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,8,power_law_1.2,0.09267839789390564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,8,power_law_1.01,0.14505599737167357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,8,power_law_1.2,0.09525759816169739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,8,power_law_1.2,0.09806720018386841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,8,power_law_1.01,0.17775360345840455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,8,power_law_1.2,0.1102463960647583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,8,power_law_1.2,0.12178560495376586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,8,power_law_1.01,0.19413119554519653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,8,power_law_1.2,0.12379519939422608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,8,power_law_1.2,0.12903679609298707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,8,power_law_1.01,0.254694390296936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,8,power_law_1.2,0.15302400588989257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,8,power_law_1.01,0.3376768112182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,8,power_law_1.2,0.17414400577545167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,8,power_law_1.2,0.050988799333572386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,8,power_law_1.2,0.20805120468139648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,8,power_law_1.01,0.47966718673706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,8,power_law_1.2,0.061536002159118655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,8,power_law_1.2,0.22929279804229735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,8,power_law_1.01,0.5951039791107178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,8,power_law_1.2,0.2866175889968872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,8,balanced,2.908426602681478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,8,power_law_1.2,0.049721598625183105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,8,power_law_1.2,0.34124159812927246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,8,power_law_1.01,0.8085503578186035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,8,power_law_1.2,0.05738880038261414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,8,balanced,2.8313013712565103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,8,power_law_1.2,0.46790399551391604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,8,power_law_1.01,1.0844991683959961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,8,power_law_1.2,0.06000000238418579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,8,power_law_1.2,0.6148608207702637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,8,power_law_1.2,0.06276479959487916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,8,power_law_1.01,1.5427712440490722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,8,power_law_1.2,0.8312895774841309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,8,power_law_1.2,0.07086079716682434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,8,power_law_1.2,1.201535987854004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,8,power_law_1.01,2.0474624633789062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,8,power_law_1.2,0.07223680019378662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,8,power_law_1.2,1.570406436920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,8,power_law_1.01,2.6847871780395507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,8,power_law_1.2,0.07811200022697448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,8,power_law_1.2,2.2556735992431642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,8,power_law_1.2,0.07722880244255066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,8,power_law_1.01,4.354444885253907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,8,power_law_1.2,4.928096008300781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,8,power_law_1.2,0.07876480221748353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,8,power_law_1.01,7.841478729248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,8,power_law_1.2,0.08388479948043823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,8,power_law_1.2,0.08972799777984619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,8,power_law_1.2,0.09058560132980346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,8,power_law_1.2,0.10341119766235352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,8,balanced,3.5437707901000977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,8,power_law_1.2,0.10999679565429688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,8,power_law_1.2,0.11518080234527588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,8,power_law_1.2,0.1419263958930969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,8,power_law_1.2,0.15004160404205322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,8,power_law_1.2,0.1855296015739441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,8,power_law_1.2,0.22572801113128663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,8,power_law_1.2,0.2868031978607178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,8,balanced,5.788656234741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,8,power_law_1.2,0.36948480606079104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,8,power_law_1.2,0.49977598190307615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,8,power_law_1.2,0.6983871936798096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,8,power_law_1.2,0.9756352424621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,8,power_law_1.2,1.2555904388427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,8,power_law_1.2,1.9020288467407227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,8,power_law_1.2,2.7044416427612306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,8,power_law_1.2,5.3247425079345705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,8,power_law_1.2,0.0608959972858429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,8,power_law_1.2,0.06771199703216553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,8,power_law_1.2,0.055430400371551516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,8,power_law_1.2,0.06176000237464905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,8,power_law_1.2,0.06761599779129028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,8,power_law_1.2,0.07389439940452576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,8,power_law_1.2,0.07932159900665284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,8,power_law_1.2,0.08238720297813415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,8,power_law_1.2,0.08659200072288513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,8,power_law_1.2,0.0869376003742218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,8,power_law_1.2,0.09155200123786926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,8,power_law_1.2,0.0956928014755249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,8,power_law_1.2,0.10238720178604126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,4,balanced,0.05526400109132131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,8,power_law_1.2,0.1091007947921753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,4,balanced,0.05657066901524862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,8,power_law_1.2,0.12469760179519654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,4,balanced,0.05850133299827576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,8,power_law_1.2,0.13360639810562133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,8,power_law_1.2,0.1497663974761963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,4,balanced,0.07654933134714763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,4,balanced,0.09291199843088786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,8,power_law_1.2,0.18507519960403443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,4,balanced,0.11928000052769978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,4,balanced,0.12085866928100586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,4,balanced,0.12285866340001424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,8,power_law_1.2,0.2146239995956421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,4,balanced,0.12363732854525249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,8,power_law_1.2,0.28336639404296876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,4,balanced,0.12298666437466939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,8,power_law_1.2,0.3755840063095093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,4,balanced,0.12504532933235168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,4,balanced,0.12797333796819052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,8,power_law_1.2,0.5315904140472412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,4,balanced,0.12940266728401184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,8,power_law_1.2,0.6401663780212402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,4,balanced,0.1330880026022593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,8,power_law_1.2,0.9750720024108886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,4,balanced,0.13823999961217245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,4,balanced,0.1421386698881785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,8,power_law_1.2,1.358118438720703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,4,balanced,0.14301333824793497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,8,power_law_1.2,1.7619647979736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,4,balanced,0.15387200315793356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,8,power_law_1.2,2.6774335861206056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,4,balanced,0.18615466356277466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,8,power_law_1.2,2.9486080169677735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,4,balanced,0.20362132787704468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,8,power_law_1.2,4.576863861083984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,4,balanced,0.23836799462636313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,8,power_law_1.2,9.594355010986328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,4,balanced,0.048384000857671104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,4,balanced,0.2939893404642741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,4,balanced,0.05077866713205973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,4,balanced,0.05295999844868978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,4,balanced,0.3600693146387736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,4,balanced,0.06181333462397257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,4,balanced,0.07646933197975159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,4,balanced,0.10499733686447144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,4,balanced,0.10596266388893127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,4,balanced,0.5056000153223673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,4,balanced,0.10760000348091125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,4,balanced,0.10916800300280254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,4,power_law_1.01,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,4,balanced,0.10902933279673259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,4,balanced,0.1092693308989207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,4,power_law_1.01,0.07249280214309692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,4,balanced,0.11327999830245972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,4,power_law_1.01,0.06024320125579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,4,balanced,0.6533546845118204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,4,power_law_1.01,0.07199360132217407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,4,balanced,0.11513599753379822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,4,balanced,0.11772800485293071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,4,power_law_1.01,0.08321279883384705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,4,balanced,0.12086932857831319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,4,power_law_1.01,0.09550079703330994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,4,balanced,0.1291253368059794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,4,power_law_1.01,0.10391039848327636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,4,power_law_1.01,0.05160319805145264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,4,balanced,0.13457600275675455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,4,power_law_1.01,0.10799360275268555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,4,balanced,0.9374132951100668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,4,power_law_1.01,0.11109119653701782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,4,power_law_1.01,0.06330239772796631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,4,balanced,0.15158399939537048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,4,power_law_1.01,0.11260800361633301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,4,power_law_1.01,0.05552639961242676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,4,balanced,0.17840532461802164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,4,power_law_1.01,0.12133760452270508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,4,power_law_1.01,0.0615231990814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,4,balanced,0.21398399273554483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,4,power_law_1.01,0.12599680423736573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,4,power_law_1.01,0.07128319740295411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,4,power_law_1.01,0.08019199967384338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,4,power_law_1.01,0.1307711958885193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,4,balanced,0.23810132344563803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,4,power_law_1.01,0.09137279987335205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,4,power_law_1.01,0.14383360147476196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,4,balanced,1.1384320259094238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,4,power_law_1.01,0.09377920031547546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,4,power_law_1.01,0.1569408059120178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,4,balanced,0.30742400884628296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,4,power_law_1.01,0.09446399807929992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,4,power_law_1.01,0.16516480445861817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,4,power_law_1.01,0.09571840167045594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,4,power_law_1.01,0.1484287977218628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,4,balanced,0.38920533657073975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,4,power_law_1.01,0.1010815978050232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,4,power_law_1.01,0.18617600202560425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,4,power_law_1.01,0.19032319784164428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,4,power_law_1.01,0.10581120252609252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,4,power_law_1.01,0.24135680198669435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,4,power_law_1.01,0.11067520380020142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,4,power_law_1.01,0.2677504062652588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,4,balanced,0.5551253159840902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,4,power_law_1.01,0.12072960138320923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,4,power_law_1.01,0.3408639907836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,4,power_law_1.01,0.12702080011367797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,4,power_law_1.01,0.4288320064544678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,4,balanced,1.530362606048584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,4,power_law_1.01,0.141484797000885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,4,power_law_1.01,0.5742591857910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,4,power_law_1.01,0.14231040477752685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,4,balanced,0.7172213395436605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,4,power_law_1.01,0.17448960542678832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,4,power_law_1.01,0.7704063892364502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,4,power_law_1.01,0.1941696047782898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,4,power_law_1.01,1.165932846069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,4,power_law_1.2,0.05785599946975708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,4,power_law_1.01,0.24710400104522706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,4,power_law_1.01,1.368447971343994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,4,power_law_1.2,0.06600319743156433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,4,power_law_1.01,0.28063359260559084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,4,power_law_1.01,1.695052719116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,4,power_law_1.2,0.0580735981464386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,4,power_law_1.01,0.37310080528259276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,4,balanced,1.041103998819987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,4,power_law_1.2,0.06702079772949218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,4,power_law_1.01,2.4657215118408202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,4,power_law_1.01,0.4457727909088135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,4,power_law_1.2,0.07519360184669495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,4,power_law_1.01,0.6370175838470459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,4,power_law_1.01,5.494009780883789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,4,power_law_1.2,0.08737919926643371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,4,power_law_1.01,0.8133631706237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,4,power_law_1.2,0.10576640367507935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,4,power_law_1.2,0.10539519786834717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,4,power_law_1.01,1.1526975631713867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,4,balanced,2.151631991068522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,4,power_law_1.2,0.10949120521545411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,4,power_law_1.01,1.519987201690674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,4,power_law_1.2,0.11311999559402466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,4,balanced,1.2990453243255615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,4,power_law_1.01,1.9274688720703126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,4,power_law_1.2,0.12117120027542114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,4,power_law_1.01,2.92238712310791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,4,power_law_1.2,0.12604160308837892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,4,power_law_1.2,0.13115520477294923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,4,power_law_1.01,5.891686248779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,4,power_law_1.2,0.14941439628601075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,4,power_law_1.2,0.16191359758377075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,4,power_law_1.2,0.16647679805755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,4,power_law_1.2,0.15088000297546386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,4,balanced,1.6982080141703289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,4,power_law_1.2,0.18896640539169313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,4,power_law_1.2,0.20257279872894288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,4,power_law_1.2,0.24522879123687744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,4,power_law_1.2,0.27539839744567873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,4,power_law_1.2,0.3732800006866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,4,power_law_1.2,0.46047358512878417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,4,power_law_1.2,0.6069119930267334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,4,power_law_1.2,0.7898047924041748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,4,power_law_1.2,1.2084927558898926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,4,power_law_1.2,1.3711551666259765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,4,power_law_1.2,1.788332748413086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,4,balanced,2.5308693250020347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,4,power_law_1.2,2.9318592071533205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,4,balanced,4.242517471313477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,4,power_law_1.2,6.273932647705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,4,power_law_1.2,0.05185279846191406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,4,power_law_1.2,0.06332799792289734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,4,power_law_1.2,0.052262401580810545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,4,power_law_1.2,0.06139519810676575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,4,power_law_1.2,0.06863359808921814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,4,power_law_1.2,0.0775551974773407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,4,power_law_1.2,0.08654720187187195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,4,power_law_1.2,0.09294080138206481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,4,power_law_1.2,0.09297919869422913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,4,power_law_1.2,0.09448959827423095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,4,power_law_1.2,0.10117119550704956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,4,power_law_1.2,0.10636160373687745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,4,power_law_1.2,0.10926719903945922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,4,power_law_1.2,0.11890560388565063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,4,power_law_1.2,0.12935680150985718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,4,power_law_1.2,0.14162559509277345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,4,power_law_1.2,0.1471743941307068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,4,power_law_1.2,0.18065919876098632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,4,power_law_1.2,0.19374719858169556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,4,power_law_1.2,0.25508480072021483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,4,balanced,5.006784121195476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,4,power_law_1.2,0.28936960697174074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,4,power_law_1.2,0.3726975917816162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,4,power_law_1.2,0.47075839042663575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,4,power_law_1.2,0.617471981048584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,4,power_law_1.2,0.8761343955993652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,4,power_law_1.2,1.236575984954834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,4,power_law_1.2,1.643391990661621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,4,power_law_1.2,1.9423871994018556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,4,power_law_1.2,3.2977855682373045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,4,power_law_1.2,7.272889709472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,128,balanced,0.04032533367474874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,128,balanced,0.04088533421357473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,128,balanced,0.03597866743803024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,128,balanced,0.041637333730856575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,128,balanced,0.042634665966033936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,128,balanced,0.0365280012289683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,128,balanced,0.04362666606903076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,128,balanced,0.04479999840259552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,128,balanced,0.03526933242877325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,128,balanced,0.04604266583919525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,128,balanced,0.03750933210055033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,128,balanced,0.04465599854787191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,128,balanced,0.03815466662247976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,128,balanced,0.04375466704368591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,128,balanced,0.03939199944337209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,128,balanced,0.04513599971930186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,128,balanced,0.0399893323580424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,128,balanced,0.042394667863845825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,128,balanced,0.03958933303753535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,128,balanced,0.0420959989229838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,128,balanced,0.03915199885765711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,128,balanced,0.042624001701672874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,128,balanced,0.04539200166861216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,128,balanced,0.03994133323431015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,128,balanced,0.04729066789150238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,128,balanced,0.03984000037113825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,128,balanced,0.0480373352766037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,128,balanced,0.04050133377313614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,128,balanced,0.04702933132648468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,128,balanced,0.03988266736268997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,128,balanced,0.04566933214664459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,128,balanced,0.03988266736268997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,128,balanced,0.047007997830708824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,128,balanced,0.04384533564249674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,128,balanced,0.045269335309664406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,128,balanced,0.043098668257395424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,128,balanced,0.04364799956480662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,128,balanced,0.02292799949645996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,128,balanced,0.04418133199214935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,128,balanced,0.022704000274340313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,128,balanced,0.044693330923716225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,128,balanced,0.059717332323392235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,128,balanced,0.022848000129063923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,128,balanced,0.0451200008392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,128,balanced,0.024058667321999867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,128,balanced,0.060218666990598045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,128,balanced,0.02515200028816859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,128,balanced,0.047498668233553566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,128,balanced,0.02585600068171819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,128,balanced,0.02621866762638092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,128,balanced,0.049285332361857094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,128,balanced,0.0765226682027181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,128,balanced,0.026122666895389557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,128,balanced,0.02621866762638092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,128,balanced,0.06682666639486949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,128,balanced,0.027280000348885853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,128,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,128,balanced,0.08588799834251404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,128,balanced,0.027434666951497395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,128,balanced,0.07541866600513458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,128,balanced,0.02808533360560735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,128,balanced,0.02864533414443334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,128,balanced,0.030762667457262676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,128,balanced,0.03019733230272929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,128,balanced,0.09949333469072978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,128,power_law_1.01,0.03930239975452423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,128,balanced,0.11985066533088684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,128,power_law_1.01,0.03370240032672882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,128,power_law_1.01,0.039468801021575926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,128,power_law_1.01,0.03973760008811951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,128,power_law_1.01,0.03400320112705231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,128,power_law_1.01,0.04019840061664581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,128,power_law_1.01,0.033529600501060484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,128,balanced,0.03128000100453695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,128,power_law_1.01,0.041817599534988405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,128,balanced,0.1165120005607605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,128,power_law_1.01,0.035519999265670774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,128,power_law_1.01,0.04268159866333008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,128,balanced,0.03274133304754893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,128,power_law_1.01,0.04188160002231598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,128,power_law_1.01,0.03606399893760681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,128,power_law_1.01,0.04217599928379059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,128,power_law_1.01,0.0367935985326767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,128,balanced,0.03195200115442276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,128,power_law_1.01,0.04182400107383728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,128,power_law_1.01,0.03874559998512268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,128,power_law_1.01,0.04005120098590851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,128,power_law_1.01,0.038540801405906676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,128,power_law_1.01,0.042156800627708435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,128,balanced,0.14390400052070618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,128,power_law_1.01,0.03840000033378601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,128,power_law_1.01,0.03950720131397247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,128,balanced,0.15819733341534933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,128,power_law_1.01,0.03886080086231232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,128,power_law_1.01,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,128,power_law_1.01,0.039059200882911684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,128,power_law_1.01,0.039743998646736146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,128,power_law_1.01,0.039724799990653994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,128,power_law_1.01,0.03865599930286408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,128,balanced,0.03639466563860575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,128,power_law_1.01,0.04074879884719849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,128,power_law_1.01,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,128,power_law_1.01,0.050374400615692136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,128,power_law_1.01,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,128,balanced,0.03709333389997482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,128,power_law_1.01,0.05952640175819397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,128,power_law_1.01,0.038924801349639895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,128,power_law_1.01,0.0652351975440979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,128,power_law_1.01,0.04602240025997162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,128,power_law_1.01,0.07728000283241272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,128,power_law_1.01,0.09294080138206481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,128,power_law_1.01,0.04758400022983551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,128,power_law_1.01,0.13318400382995604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,128,balanced,0.1962719957033793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,128,power_law_1.01,0.05241600275039673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,128,balanced,0.17620267470677695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,128,power_law_1.01,0.17860480546951293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,128,power_law_1.01,0.05630720257759094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,128,power_law_1.01,0.23828480243682862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,128,power_law_1.01,0.07190399765968322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,128,balanced,0.04344533383846283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,128,power_law_1.01,0.3178368091583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,128,power_law_1.01,0.08094080090522766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,128,power_law_1.01,0.49993600845336916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,128,power_law_1.01,0.12550400495529174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,128,power_law_1.01,0.6525375843048096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,128,power_law_1.01,0.1404031991958618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,128,balanced,0.04669333497683207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,128,power_law_1.01,0.771289587020874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,128,power_law_1.01,0.225164794921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,128,power_law_1.01,1.2806528091430665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,128,power_law_1.01,0.2533247947692871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,128,power_law_1.01,0.3791039943695068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,128,power_law_1.01,2.7091007232666016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,128,power_law_1.01,0.5062335968017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,128,balanced,0.23586666584014893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,128,power_law_1.01,0.022233599424362184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,128,power_law_1.01,0.5786240100860596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,128,power_law_1.01,0.022041599452495574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,128,power_law_1.01,1.0679295539855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,128,power_law_1.01,0.022316800057888032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,128,balanced,0.06035733222961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,128,power_law_1.01,0.02399359941482544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,128,power_law_1.01,2.0515647888183595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,128,power_law_1.01,0.02456959933042526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,128,balanced,0.2600586613019307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,128,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,128,power_law_1.01,0.02590720057487488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,128,power_law_1.01,0.02602880001068115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,128,power_law_1.01,0.02622720003128052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,128,power_law_1.01,0.026572799682617186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,128,balanced,0.06985066831111908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,128,power_law_1.01,0.02705279886722565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,1,128,power_law_1.2,0.04017919898033142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,128,power_law_1.01,0.02754560112953186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,1,128,power_law_1.2,0.040575999021530154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,128,balanced,0.3537866671880086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,128,power_law_1.01,0.02775680124759674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,1,128,power_law_1.2,0.04145280122756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,128,power_law_1.01,0.029216000437736513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,1,128,power_law_1.2,0.04156799912452698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,128,power_law_1.01,0.03150080144405365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,1,128,power_law_1.2,0.04261760115623474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,128,power_law_1.01,0.03364480137825012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,1,128,power_law_1.2,0.04376319944858551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,1,128,power_law_1.2,0.0435263991355896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,128,power_law_1.01,0.04288640022277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,1,128,power_law_1.2,0.04284160137176514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,1,128,power_law_1.2,0.04178560078144074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,128,power_law_1.01,0.050342398881912234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,128,balanced,0.0923466682434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,1,128,power_law_1.2,0.042310398817062375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,128,power_law_1.01,0.054502397775650024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,1,128,power_law_1.2,0.04085119962692261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,128,power_law_1.2,0.03591679930686951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,1,128,power_law_1.2,0.038771200180053714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,128,power_law_1.01,0.06593919992446899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,128,power_law_1.2,0.03518719971179962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,1,128,power_law_1.2,0.037913599610328676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,128,power_law_1.01,0.08261759877204895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,128,power_law_1.2,0.03384959995746613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,1,128,power_law_1.2,0.045484799146652224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,128,power_law_1.2,0.03720960021018982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,1,128,power_law_1.2,0.05234559774398804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,128,power_law_1.2,0.03697920143604279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,1,128,power_law_1.2,0.05053439736366272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,128,power_law_1.01,0.09430400133132935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,128,power_law_1.2,0.039212799072265624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,1,128,power_law_1.2,0.052198398113250735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,128,power_law_1.01,0.12239359617233277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,1,128,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,128,power_law_1.2,0.03900800049304962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,128,balanced,0.48790931701660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,128,balanced,0.11231467127799988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,128,power_law_1.2,0.038624000549316403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,128,power_law_1.2,0.08771839737892151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,128,power_law_1.01,0.15569920539855958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,128,power_law_1.2,0.10239360332489014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,128,power_law_1.2,0.03845759928226471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,128,power_law_1.2,0.0378495991230011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,128,power_law_1.2,0.1348479986190796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,128,power_law_1.01,0.20019838809967042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,128,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,128,power_law_1.2,0.19115519523620605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,128,power_law_1.2,0.03743360042572021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,128,power_law_1.2,0.24732799530029298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,128,power_law_1.2,0.03849599957466125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,128,power_law_1.01,0.2931648015975952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,128,power_law_1.2,0.32892799377441406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,128,balanced,0.6724426746368408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,128,power_law_1.2,0.037894400954246524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,128,power_law_1.2,0.4960768222808838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,128,power_law_1.2,0.04451839923858643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,128,power_law_1.01,0.38567678928375243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,128,power_law_1.2,0.725657606124878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,128,power_law_1.2,0.04636160135269165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,128,power_law_1.2,0.9341888427734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,128,power_law_1.2,0.04556800127029419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,128,power_law_1.2,1.2043840408325195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,128,power_law_1.2,0.05497599840164184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,128,power_law_1.2,0.06460800170898437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,128,balanced,0.13430399696032205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,128,power_law_1.2,1.9355455398559571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,128,power_law_1.01,0.499724817276001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,128,power_law_1.2,0.08275840282440186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,128,power_law_1.01,0.9066816329956054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,128,power_law_1.2,3.911840057373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,128,power_law_1.2,0.10968960523605346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,128,power_law_1.2,0.15232640504837036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,128,power_law_1.01,1.592262363433838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,128,power_law_1.2,0.19095040559768678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,128,power_law_1.2,0.3073728084564209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,128,power_law_1.2,0.38246400356292726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,128,power_law_1.2,0.5581696033477783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,128,power_law_1.2,0.7792768001556396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,128,power_law_1.2,0.9631104469299316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,128,power_law_1.2,1.5103679656982423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,128,balanced,0.19965332746505737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,128,power_law_1.2,2.9840768814086913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,64,balanced,0.02271999915440877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,64,balanced,0.02613866577545802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,64,balanced,0.02266666789849599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,64,balanced,0.023823998868465424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,128,power_law_1.2,0.021958400309085847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,128,balanced,0.36793065071105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,64,balanced,0.024133334557215374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,128,power_law_1.2,0.02195200026035309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,64,balanced,0.025413334369659424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,128,power_law_1.2,0.022336000204086305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,64,balanced,0.02632533262173335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,128,power_law_1.2,0.024083200097084045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,64,balanced,0.025813333690166473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,128,power_law_1.2,0.024607999622821806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,64,balanced,0.02571733295917511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,128,power_law_1.2,0.025382399559020996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,64,balanced,0.026357332865397137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,128,power_law_1.2,0.026060798764228822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,64,balanced,0.026789332429567974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,128,power_law_1.2,0.025990399718284606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,64,balanced,0.02696000039577484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,128,power_law_1.2,0.026233598589897156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,64,balanced,0.027850667635599773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,128,power_law_1.2,0.02632960081100464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,64,balanced,0.03422933320204417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,128,power_law_1.2,0.02736000120639801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,64,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,128,power_law_1.2,0.02768000066280365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,64,balanced,0.03603733330965042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,128,power_law_1.2,0.028428798913955687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,64,balanced,0.03694933404525121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,128,power_law_1.2,0.0297791987657547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,64,balanced,0.037946666280428566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,128,power_law_1.2,0.03325439989566803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,128,power_law_1.2,0.037529599666595456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,64,balanced,0.03900266687075297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,64,balanced,0.041690667470296226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,128,power_law_1.2,0.04734080135822296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,64,balanced,0.04195733368396759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,128,power_law_1.2,0.06514559984207154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,64,balanced,0.02998399982849757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,128,power_law_1.2,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,64,balanced,0.028597332537174225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,64,balanced,0.028901333610216778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,64,balanced,0.04964800179004669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,64,balanced,0.03073066721359889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,64,balanced,0.0337119996547699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,128,power_law_1.2,0.08781440258026123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,64,balanced,0.033359999457995095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,64,balanced,0.04764799773693085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,64,balanced,0.03320533285538355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,128,power_law_1.2,0.11200640201568604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,64,balanced,0.03325333446264267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,64,balanced,0.03323200096686681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,64,balanced,0.03404266635576884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,128,power_law_1.2,0.14212479591369628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,64,balanced,0.03412266572316488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,64,balanced,0.06084799766540527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,64,balanced,0.03454933315515518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,128,power_law_1.2,0.18954880237579347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,64,balanced,0.03513599932193756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,64,balanced,0.03624533365170161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,64,balanced,0.03826133410135905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,128,power_law_1.2,0.24569599628448485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,64,balanced,0.0376800000667572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,64,balanced,0.06145599981149038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,64,balanced,0.038805333276589714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,64,balanced,0.0397173340121905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,128,power_law_1.2,0.3287935972213745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,64,balanced,0.040922666589419045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,64,balanced,0.043605332573254905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,64,balanced,0.02235200007756551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,128,power_law_1.2,0.4769536018371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,64,power_law_1.01,0.02247679978609085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,64,balanced,0.04632533093293508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,64,balanced,0.02250133454799652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,64,balanced,0.08055466910203297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,64,balanced,0.022442666192849476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,64,power_law_1.01,0.026476800441741943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,64,balanced,0.05866133173306783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,128,power_law_1.2,0.5933248043060303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,64,balanced,0.023792001108328503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,64,power_law_1.01,0.022047999501228332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,64,balanced,0.025226667523384094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,64,power_law_1.01,0.023603199422359465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,64,balanced,0.02613866577545802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,64,balanced,0.06569066643714905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,64,power_law_1.01,0.024006399512290954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,64,balanced,0.02624533325433731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,128,power_law_1.2,0.7583807945251465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,64,balanced,0.026261332134405773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,64,power_law_1.01,0.025017601251602174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,128,power_law_1.2,1.2038335800170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,64,balanced,0.02641066660483678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,64,power_law_1.01,0.025254398584365845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,64,balanced,0.08619200189908345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,64,balanced,0.027130665878454845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,64,power_law_1.01,0.024825599789619446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,64,power_law_1.01,0.031590399146080014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,64,balanced,0.08708266417185466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,128,power_law_1.2,2.3368831634521485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,64,balanced,0.02741866558790207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,64,power_law_1.01,0.028403198719024657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,64,power_law_1.01,0.02967039942741394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,64,balanced,0.027503999571005504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,64,power_law_1.01,0.031020799279212953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,64,balanced,0.02864533414443334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,64,power_law_1.01,0.0285504013299942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,64,balanced,0.09800533453623454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,64,power_law_1.01,0.03200640082359314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,64,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,64,power_law_1.01,0.03144319951534271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,64,power_law_1.01,0.032671999931335446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,64,power_law_1.01,0.03188480138778686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,64,balanced,0.031045332551002502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,64,power_law_1.01,0.03283840119838714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,64,power_law_1.01,0.032793599367141726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,64,balanced,0.030602666238943737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,64,power_law_1.01,0.034220799803733826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,64,power_law_1.01,0.03475199937820435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,64,balanced,0.13014933466911316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,64,power_law_1.01,0.03653759956359863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,64,power_law_1.01,0.03320319950580597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,64,balanced,0.09949866930643718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,64,power_law_1.01,0.037625598907470706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,64,power_law_1.01,0.03330560028553009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,64,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,64,balanced,0.03150933235883713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,64,power_law_1.01,0.04010879993438721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,64,power_law_1.01,0.03380480110645294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,64,power_law_1.01,0.022111999988555908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,64,balanced,0.03359466542800268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,64,power_law_1.01,0.04237439930438995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,64,power_law_1.01,0.03442560136318207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,64,power_law_1.01,0.022303999960422517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,64,power_law_1.01,0.04802559912204742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,64,power_law_1.01,0.035097599029541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,64,balanced,0.033013333876927696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,64,power_law_1.01,0.06632320284843445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,64,power_law_1.01,0.02418559938669205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,64,power_law_1.01,0.035359999537467955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,64,balanced,0.154831995566686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,64,power_law_1.01,0.02494720071554184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,64,power_law_1.01,0.06660479903221131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,64,power_law_1.01,0.0374208003282547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,64,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,64,power_law_1.01,0.09043840169906617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,64,power_law_1.01,0.03941119909286499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,64,power_law_1.01,0.026086398959159852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,64,power_law_1.01,0.04007039964199066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,64,power_law_1.01,0.08947839736938476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,64,balanced,0.03761066744724909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,64,power_law_1.01,0.02643199861049652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,64,power_law_1.01,0.042668798565864564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,64,power_law_1.01,0.12346240282058715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,64,power_law_1.01,0.026470398902893065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,64,balanced,0.03897066662708918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,64,power_law_1.01,0.0460671991109848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,64,power_law_1.01,0.11207679510116578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,64,power_law_1.01,0.02733440101146698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,64,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,64,power_law_1.01,0.20227839946746826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,64,power_law_1.01,0.027475199103355406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,64,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,64,power_law_1.01,0.0278656005859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,64,power_law_1.01,0.2227776050567627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,64,power_law_1.01,0.06474879980087281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,64,balanced,0.1383840044339498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,64,power_law_1.01,0.02913280129432678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,64,balanced,0.18259199460347494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,64,power_law_1.01,0.27351040840148927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,64,power_law_1.01,0.09409279823303222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,64,power_law_1.01,0.029836800694465638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,64,balanced,0.04646400113900503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,64,power_law_1.01,0.407916784286499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,64,power_law_1.01,0.10582400560379028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,64,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,64,power_law_1.01,0.1334720015525818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,64,power_law_1.01,0.03402880132198334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,64,power_law_1.01,0.950534439086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,64,balanced,0.05046933392683665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,64,power_law_1.01,0.16202880144119264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,64,power_law_1.2,0.02261119931936264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,64,power_law_1.01,0.22850561141967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,64,power_law_1.01,0.04007680118083954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,64,power_law_1.2,0.025964799523353576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,64,power_law_1.01,0.289849591255188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,64,power_law_1.01,0.04743039906024933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,64,power_law_1.2,0.022419199347496033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,64,power_law_1.01,0.35907199382781985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,64,power_law_1.01,0.052825599908828735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,64,power_law_1.2,0.023603199422359465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,64,power_law_1.01,0.5705088138580322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,64,power_law_1.2,0.024352000653743745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,64,balanced,0.06558933357397716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,64,power_law_1.01,0.06788480281829834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,64,power_law_1.01,1.164192008972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,64,power_law_1.2,0.024908800423145295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,64,power_law_1.01,0.08202880024909973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,64,power_law_1.2,0.025356799364089966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,64,balanced,0.2680000066757202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,64,power_law_1.2,0.028249600529670717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,64,power_law_1.2,0.03078399896621704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,64,power_law_1.01,0.0959231972694397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,64,power_law_1.2,0.03125759959220886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,64,power_law_1.01,0.12726399898529053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,64,balanced,0.07800533374150594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,64,power_law_1.2,0.0321727991104126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,64,power_law_1.2,0.03277440071105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,64,power_law_1.01,0.1573632001876831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,64,power_law_1.2,0.034092798829078674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,64,power_law_1.2,0.03619199991226196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,64,power_law_1.01,0.19390079975128174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,64,power_law_1.2,0.037363201379776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,64,power_law_1.2,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,64,power_law_1.2,0.039852800965309146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,64,balanced,0.10538132985432942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,64,power_law_1.01,0.32739839553833006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,64,balanced,0.23512534300486246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,64,power_law_1.2,0.04723199903964996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,64,power_law_1.2,0.05594239830970764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,64,power_law_1.2,0.07582079768180847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,64,power_law_1.01,0.36854400634765627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,64,power_law_1.2,0.08009600043296813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,64,power_law_1.2,0.10107519626617431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,64,power_law_1.01,0.4850175857543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,64,power_law_1.2,0.12116479873657227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,64,balanced,0.12905599673589072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,64,power_law_1.01,0.7537536144256591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,64,power_law_1.2,0.1460543990135193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,64,power_law_1.2,0.21713919639587403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,64,power_law_1.01,1.508415985107422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,64,power_law_1.2,0.31154561042785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,64,power_law_1.2,0.3441472053527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,64,balanced,0.4923893213272095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,64,power_law_1.2,0.47493758201599123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,64,power_law_1.2,0.6486911773681641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,64,power_law_1.2,1.8151231765747071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,64,balanced,0.15370666980743408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,64,balanced,0.23172267278035483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,64,power_law_1.2,0.03136000037193298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,64,power_law_1.2,0.028934401273727418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,64,power_law_1.2,0.02879360020160675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,64,power_law_1.2,0.03187200129032135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,64,power_law_1.2,0.033267199993133545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,64,power_law_1.2,0.03278079926967621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,64,power_law_1.2,0.033055999875068666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,64,power_law_1.2,0.03356800079345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,64,power_law_1.2,0.033529600501060484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,64,power_law_1.2,0.033855998516082765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,64,power_law_1.2,0.03473280072212219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,64,power_law_1.2,0.03526400029659271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,64,power_law_1.2,0.036268800497055054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,64,power_law_1.2,0.03715839982032776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,64,power_law_1.2,0.039878401160240176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,64,power_law_1.2,0.0409855991601944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,64,power_law_1.2,0.04442239999771118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,64,power_law_1.2,0.047775998711586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,64,power_law_1.2,0.051622402667999265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,64,power_law_1.2,0.06333439946174621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,64,power_law_1.2,0.07441920042037964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,64,balanced,0.45602134863535565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,64,power_law_1.2,0.10755840539932252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,64,power_law_1.2,0.11349120140075683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,64,power_law_1.2,0.17503360509872437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,64,power_law_1.2,0.022329600155353548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,64,power_law_1.2,0.2149183988571167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,64,power_law_1.2,0.02189439982175827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,64,power_law_1.2,0.3480384111404419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,64,power_law_1.2,0.022310400009155275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,64,power_law_1.2,0.43114237785339354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,64,power_law_1.2,0.024332800507545473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,32,balanced,0.023599999646345775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,64,power_law_1.2,0.5730048179626465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,64,power_law_1.2,0.02510719895362854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,64,power_law_1.2,0.9378239631652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,32,balanced,0.02186666677395503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,64,power_law_1.2,0.025747200846672057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,64,power_law_1.2,0.02635520100593567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,64,power_law_1.2,2.237676811218262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,32,balanced,0.021712000171343487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,64,power_law_1.2,0.026444798707962035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,32,balanced,0.023232000569502514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,64,power_law_1.2,0.026643198728561402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,32,balanced,0.023669332265853882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,64,power_law_1.2,0.0268095999956131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,32,balanced,0.02492800106604894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,64,power_law_1.2,0.027769601345062254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,32,balanced,0.025333332518736523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,64,power_law_1.2,0.0282368004322052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,32,balanced,0.025290665527184803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,32,balanced,0.024874667326609295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,64,power_law_1.2,0.029241600632667543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,32,balanced,0.025439999997615814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,64,power_law_1.2,0.031699201464653014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,32,balanced,0.02595199892918269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,32,balanced,0.02651199946800868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,64,power_law_1.2,0.034796801209449765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,32,balanced,0.02677333354949951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,64,power_law_1.2,0.036051198840141296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,32,balanced,0.03461333364248276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,32,balanced,0.03033600002527237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,32,balanced,0.03504000107447306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,32,balanced,0.03514133393764496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,64,power_law_1.2,0.04161919951438904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,32,balanced,0.028917332490285236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,32,balanced,0.03867200016975403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,32,balanced,0.02852799991766612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,64,power_law_1.2,0.05353599786758423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,32,balanced,0.030981334547201794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,32,balanced,0.03842666745185852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,64,power_law_1.2,0.06444159746170045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,32,balanced,0.03267733256022135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,32,balanced,0.03977066775163015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,32,balanced,0.03332799921433131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,32,balanced,0.040336000422636666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,32,balanced,0.03349866718053818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,64,power_law_1.2,0.08557440042495727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,32,balanced,0.033359999457995095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,32,balanced,0.043141335248947144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,32,balanced,0.033615998923778534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,64,power_law_1.2,0.08767359852790832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,32,balanced,0.03462400039037069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,32,balanced,0.05276800195376078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,32,balanced,0.03509866694609324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,32,balanced,0.03480000048875809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,64,power_law_1.2,0.12369279861450196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,32,balanced,0.03596800069014231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,64,power_law_1.2,0.1533951997756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,32,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,32,balanced,0.03612799942493439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,32,balanced,0.022602667411168415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,32,power_law_1.01,0.02423679977655411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,32,balanced,0.03864533454179764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,32,balanced,0.022618666291236877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,64,power_law_1.2,0.22627840042114258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,32,balanced,0.038506666819254555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,32,balanced,0.022474666436513264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,32,power_law_1.01,0.021350400149822236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,32,balanced,0.0646666685740153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,32,power_law_1.01,0.032128000259399415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,32,balanced,0.024480000138282776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,32,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,32,balanced,0.03974399964014689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,64,power_law_1.2,0.315231990814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,32,power_law_1.01,0.029318401217460634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,32,balanced,0.025802666942278545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,32,balanced,0.04048533240954081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,32,power_law_1.01,0.022835199534893037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,32,balanced,0.026613332331180573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,32,power_law_1.01,0.029382398724555968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,32,power_law_1.01,0.02341119945049286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,32,balanced,0.06669333577156067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,32,balanced,0.04189866781234741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,64,power_law_1.2,0.5567808151245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,32,balanced,0.026928000152111053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,32,power_law_1.01,0.03127039968967438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,32,power_law_1.01,0.02454400062561035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,32,balanced,0.026943999032179516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,32,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,32,power_law_1.01,0.03155199885368347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,32,balanced,0.026954665780067444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,32,power_law_1.01,0.024480000138282776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,64,power_law_1.2,0.6082111835479737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,32,power_law_1.01,0.033030399680137636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,32,balanced,0.027456000447273254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,32,power_law_1.01,0.02462719976902008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,32,balanced,0.04861866434415182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,32,power_law_1.01,0.033107200264930726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,32,balanced,0.027978666126728058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,64,power_law_1.2,0.9286144256591797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,32,power_law_1.01,0.029977598786354066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,32,power_law_1.01,0.03395200073719025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,32,balanced,0.028149334092934925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,32,balanced,0.08999466896057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,32,balanced,0.06292266647020976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,32,power_law_1.01,0.030406400561332703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,64,power_law_1.2,1.7626047134399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,32,power_law_1.01,0.03333759903907776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,32,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,32,power_law_1.01,0.03343360126018524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,32,power_law_1.01,0.03320319950580597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,32,balanced,0.029365333418051403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,64,power_law_1.2,3.0198720932006835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,32,power_law_1.01,0.03592320084571839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,32,balanced,0.07055999835332234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,32,balanced,0.03233599911133448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,32,power_law_1.01,0.03409920036792755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,32,power_law_1.01,0.03925119936466217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,32,balanced,0.03173866619666418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,32,power_law_1.01,0.03475840091705322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,32,power_law_1.01,0.03528960049152374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,32,power_law_1.01,0.03591679930686951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,32,balanced,0.09250133236249287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,32,power_law_1.01,0.037088000774383546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,32,power_law_1.01,0.037567999958992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,32,balanced,0.09948266545931499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,32,power_law_1.01,0.03731200098991394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,32,power_law_1.01,0.03997440040111542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,32,balanced,0.03298133363326391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,32,power_law_1.01,0.03929600119590759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,32,power_law_1.01,0.0404992014169693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,32,balanced,0.035562666753927864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,32,power_law_1.01,0.045414400100708005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,32,balanced,0.10700266559918721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,32,power_law_1.01,0.04300160109996796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,32,power_law_1.01,0.048230400681495665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,32,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,32,power_law_1.01,0.04782719910144806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,32,power_law_1.01,0.057081598043441775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,32,power_law_1.01,0.04896000027656555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,32,power_law_1.01,0.0617792010307312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,32,power_law_1.01,0.05994240045547485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,32,power_law_1.01,0.08128640055656433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,32,power_law_1.01,0.06709759831428527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,32,balanced,0.04077333211898804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,32,balanced,0.14452266693115234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,32,power_law_1.01,0.07986559867858886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,32,balanced,0.11685333649317424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,32,power_law_1.01,0.09057919979095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,32,power_law_1.01,0.10424959659576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,32,balanced,0.043040002385775246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,32,power_law_1.01,0.09903360009193421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,32,power_law_1.01,0.12151039838790893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,32,power_law_1.01,0.1400063991546631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,32,power_law_1.01,0.17091200351715088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,32,power_law_1.01,0.1605504035949707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,32,power_law_1.01,0.22672638893127442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,32,power_law_1.01,0.20314879417419435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,32,balanced,0.05352533360322317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,32,power_law_1.01,0.2979007959365845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,32,power_law_1.01,0.24824960231781007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,32,balanced,0.1738719940185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,32,power_law_1.01,0.34345600605010984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,32,power_law_1.01,0.4258687973022461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,32,balanced,0.061119998494784035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,32,power_law_1.01,0.5554751873016357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,32,power_law_1.01,0.7736512184143066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,32,power_law_1.01,1.2468031883239745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,32,balanced,0.16904000441233316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,32,balanced,0.0796853353579839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,32,balanced,0.20746666193008423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,32,balanced,0.09709866841634114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,32,power_law_1.01,0.023763200640678404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,32,power_law_1.01,0.02268799990415573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,32,power_law_1.01,0.02284799963235855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,32,power_law_1.01,0.024928000569343568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,32,power_law_1.01,0.025388801097869874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,32,power_law_1.01,0.02648319900035858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,32,power_law_1.2,0.02401919960975647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,32,power_law_1.01,0.027001601457595826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,32,power_law_1.2,0.02131839990615845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,32,balanced,0.1327946682771047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,32,power_law_1.01,0.02717440128326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,32,power_law_1.2,0.021350400149822236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,32,balanced,0.3099626700083415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,32,power_law_1.01,0.027039998769760133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,32,power_law_1.2,0.022892799973487855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,32,power_law_1.01,0.027315199375152588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,32,power_law_1.2,0.02620159983634949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,32,power_law_1.2,0.02447360008955002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,32,power_law_1.01,0.02826879918575287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,32,power_law_1.2,0.024633599817752837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,32,power_law_1.01,0.029292801022529603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,32,power_law_1.2,0.02771199941635132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,32,power_law_1.01,0.030822399258613586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,32,power_law_1.2,0.030297601222991945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,32,power_law_1.01,0.031718400120735166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,32,power_law_1.2,0.030796799063682555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,32,power_law_1.01,0.03410559892654419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,32,power_law_1.2,0.03447679877281189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,32,balanced,0.1646346648534139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,32,power_law_1.01,0.03699840009212494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,32,power_law_1.2,0.04000000059604645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,32,power_law_1.2,0.04519680142402649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,32,balanced,0.3001493414243062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,32,power_law_1.2,0.0348800003528595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,32,power_law_1.01,0.04063999950885773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,32,power_law_1.2,0.037215998768806456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,32,power_law_1.01,0.04840959906578064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,32,power_law_1.2,0.0377344012260437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,32,power_law_1.01,0.05422080159187317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,32,power_law_1.2,0.04071680009365082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,32,power_law_1.2,0.04625279903411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,32,power_law_1.2,0.050918400287628174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,32,balanced,0.200655996799469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,32,power_law_1.01,0.06687359809875489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,32,power_law_1.2,0.06327679753303528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,32,power_law_1.01,0.07360640168190002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,32,power_law_1.2,0.0743615984916687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,32,power_law_1.2,0.10200320482254029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,32,power_law_1.01,0.09522560238838196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,32,power_law_1.2,0.10181759595870972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,32,power_law_1.01,0.11749759912490845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,32,power_law_1.2,0.15794559717178344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,32,power_law_1.2,0.18236160278320312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,32,power_law_1.01,0.15273599624633788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,32,power_law_1.2,0.24476799964904786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,32,balanced,0.5768426656723022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,32,power_law_1.2,0.30680320262908933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,32,power_law_1.01,0.2241215944290161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,32,power_law_1.2,0.333459210395813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,32,power_law_1.01,0.31875200271606446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,32,power_law_1.2,0.5980991840362548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,32,balanced,0.32530667384465534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,32,power_law_1.01,0.4093503952026367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,32,power_law_1.2,1.5299391746520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,32,power_law_1.01,0.5613120079040528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,32,power_law_1.2,0.03249920010566711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,32,power_law_1.01,0.7742464065551757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,32,power_law_1.2,0.02927359938621521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,32,power_law_1.01,1.804742431640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,32,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,32,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,32,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,32,power_law_1.2,0.03299199938774109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,32,power_law_1.2,0.03292160034179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,32,power_law_1.2,0.033632001280784606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,32,power_law_1.2,0.033369600772857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,32,power_law_1.2,0.03348479866981506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,32,power_law_1.2,0.035257598757743834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,32,power_law_1.2,0.03598720133304596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,32,power_law_1.2,0.03811840116977692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,32,power_law_1.2,0.038515201210975646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,32,power_law_1.2,0.04012799859046936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,32,power_law_1.2,0.04160000085830688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,32,power_law_1.2,0.045126399397850035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,32,power_law_1.2,0.04838399887084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,32,power_law_1.2,0.05242239832878113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,32,power_law_1.2,0.06566399931907654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,32,balanced,0.6208000183105469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,32,power_law_1.2,0.07491199970245362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,32,power_law_1.2,0.10261759757995606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,32,power_law_1.2,0.02399359941482544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,32,power_law_1.2,0.10806399583816528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,32,power_law_1.2,0.022361600399017335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,32,power_law_1.2,0.1539520025253296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,32,power_law_1.2,0.023001599311828613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,32,power_law_1.2,0.2558271884918213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,32,power_law_1.2,0.025062400102615356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,32,power_law_1.2,0.37876479625701903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,128,balanced,0.09455999732017517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,32,power_law_1.2,0.02555519938468933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,32,power_law_1.2,0.3946880102157593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,128,balanced,0.08659199873606364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,32,power_law_1.2,0.026739200949668883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,128,balanced,0.08702400326728821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,32,power_law_1.2,0.5158080101013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,32,power_law_1.2,0.02691200077533722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,128,balanced,0.09194133679072063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,32,power_law_1.2,0.9902976036071778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,32,power_law_1.2,0.026956799626350402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,128,balanced,0.08869866530100505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,32,power_law_1.2,0.026931199431419372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,32,power_law_1.2,2.1930112838745117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,128,balanced,0.09502933422724406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,32,power_law_1.2,0.027276799082756042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,128,balanced,0.09518933296203613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,128,balanced,0.09822400410970052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,32,power_law_1.2,0.028787198662757873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,128,balanced,0.08927999933560689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,32,power_law_1.2,0.030073601007461547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,128,balanced,0.09898666540781657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,32,power_law_1.2,0.03086079955101013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,128,balanced,0.10203733046849568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,32,power_law_1.2,0.03229439854621887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,128,balanced,0.10188800096511841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,32,power_law_1.2,0.03711360096931458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,128,balanced,0.09820800026257832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,32,power_law_1.2,0.037785598635673524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,128,balanced,0.0904319981733958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,128,balanced,0.09694400429725647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,32,power_law_1.2,0.042387199401855466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,128,balanced,0.10289600491523743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,32,power_law_1.2,0.05211520195007324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,32,power_law_1.2,0.061945599317550656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,128,balanced,0.09085333347320557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,128,balanced,0.09058666229248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,32,power_law_1.2,0.0805184006690979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,128,balanced,0.08675733208656311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,128,balanced,0.061978667974472046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,32,power_law_1.2,0.0867904007434845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,128,balanced,0.08284266789754231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,128,balanced,0.06257600088914235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,128,balanced,0.06196799874305725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,32,power_law_1.2,0.11160320043563843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,128,balanced,0.07422933479150136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,128,balanced,0.06422399977842967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,32,power_law_1.2,0.15175039768218995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,128,balanced,0.06471999982992808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,128,balanced,0.06607999900976817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,128,balanced,0.12133866548538208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,128,balanced,0.06102400024731954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,128,balanced,0.06676800052324931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,32,power_law_1.2,0.3233920097351074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,128,balanced,0.060933331648508705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,128,balanced,0.10487999518712361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,128,balanced,0.06720000008742015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,32,power_law_1.2,0.35009920597076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,128,balanced,0.06579199930032094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,128,balanced,0.06472533444563548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,128,balanced,0.06551999847094218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,128,balanced,0.14717866977055868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,32,power_law_1.2,0.5462336063385009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,128,balanced,0.06321600079536438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,128,balanced,0.06763733426729839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,32,power_law_1.2,0.6218431949615478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,128,balanced,0.07049066821734111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,128,balanced,0.0687306672334671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,32,power_law_1.2,0.7269375801086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,128,balanced,0.17694399754206339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,128,balanced,0.070783997575442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,32,power_law_1.2,1.778335952758789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,128,balanced,0.07216533521811168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,32,power_law_1.2,2.8318336486816404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,128,balanced,0.07899199922879536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,128,balanced,0.25034133593241376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,128,balanced,0.08032000064849854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,128,balanced,0.12122666835784912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,128,power_law_1.01,0.09537919759750366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,128,balanced,0.027552001178264618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,128,power_law_1.01,0.08491520285606384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,128,balanced,0.027295999228954315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,128,balanced,0.1200213332970937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,128,power_law_1.01,0.09455360174179077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,128,balanced,0.02754133443037669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,128,power_law_1.01,0.09189119935035706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,128,balanced,0.02865600089232127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,128,balanced,0.32184000809987384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,128,power_law_1.01,0.09510400295257568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,128,power_law_1.01,0.05839999914169312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,128,balanced,0.02975466599067052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,128,balanced,0.16632533073425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,128,power_law_1.01,0.09761279821395874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,128,balanced,0.0308746670683225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,128,power_law_1.01,0.05934720039367676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,128,power_law_1.01,0.09552639722824097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,128,balanced,0.03088533381621043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,128,power_law_1.01,0.058297598361968996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,128,power_law_1.01,0.09745280146598816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,128,balanced,0.030938667555650074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,128,power_law_1.01,0.06542080044746398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,128,power_law_1.01,0.08698239922523499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,128,power_law_1.01,0.06155520081520081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,128,balanced,0.031034665803114574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,128,balanced,0.2041226625442505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,128,power_law_1.01,0.09498879909515381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,128,power_law_1.01,0.06355199813842774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,128,balanced,0.03180799881617228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,128,power_law_1.01,0.08857600092887878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,128,power_law_1.01,0.06257920265197754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,128,balanced,0.032314665615558624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,128,power_law_1.01,0.08403840065002441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,128,power_law_1.01,0.06519039869308471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,128,balanced,0.3931573232014974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,128,balanced,0.032399999598662056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,128,power_law_1.01,0.08092799782752991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,128,power_law_1.01,0.06017919778823853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,128,balanced,0.033146666983763375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,128,power_law_1.01,0.07705600261688232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,128,power_law_1.01,0.06290559768676758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,128,balanced,0.2874079942703247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,128,balanced,0.033386667569478355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,128,power_law_1.01,0.06505600214004517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,128,power_law_1.01,0.06053119897842407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,128,balanced,0.036090667049090065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,128,power_law_1.01,0.13057279586791992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,128,power_law_1.01,0.06047359704971313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,128,balanced,0.03557866563399633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,128,power_law_1.01,0.1106495976448059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,128,power_law_1.01,0.05922560095787048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,128,power_law_1.01,0.13473279476165773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,128,power_law_1.01,0.05665919780731201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,128,power_law_1.01,0.1743615984916687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,128,power_law_1.01,0.0531391978263855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,128,power_law_1.01,0.1879680037498474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,128,power_law_1.01,0.07159680128097534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,128,balanced,0.36926400661468506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,128,balanced,0.036720000207424164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,128,power_law_1.01,0.07578240036964416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,128,power_law_1.01,0.2602560043334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,128,power_law_1.01,0.10295039415359497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,128,power_law_1.01,0.3514496088027954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,128,balanced,0.039647998909155525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,128,power_law_1.01,0.10931839942932128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,128,power_law_1.01,0.4795519828796387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,128,balanced,0.0397119993964831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,128,power_law_1.01,0.13948160409927368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,128,balanced,0.6106400092442831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,128,power_law_1.01,0.6892096042633057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,128,power_law_1.01,0.18842240571975707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,128,power_law_1.01,0.9388287544250489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,128,power_law_1.01,0.25805439949035647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,128,power_law_1.01,1.6582912445068358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,128,power_law_1.01,0.32794239521026614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,128,power_law_1.01,2.172646331787109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,128,power_law_1.01,0.4557504177093506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,128,power_law_1.01,0.02705279886722565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,128,balanced,0.047877331574757896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,128,balanced,0.45002134641011554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,128,power_law_1.01,2.607187271118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,128,power_law_1.01,0.6384640216827393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,128,power_law_1.01,0.027276799082756042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,128,power_law_1.01,0.02723200023174286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,128,balanced,0.05317866802215576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,128,power_law_1.01,4.346803283691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,128,power_law_1.01,0.9097408294677735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,128,power_law_1.01,0.02924799919128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,128,power_law_1.01,0.029708799719810487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,128,power_law_1.2,0.10414719581604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,128,power_law_1.01,10.621427154541015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,128,power_law_1.01,1.3136256217956543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,128,power_law_1.01,0.03134720027446747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,128,power_law_1.2,0.09251840114593506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,128,power_law_1.01,0.03125759959220886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,128,power_law_1.01,1.627724838256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,128,power_law_1.2,0.09397760033607483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,128,power_law_1.01,0.0313728004693985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,128,power_law_1.2,0.10465919971466064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,128,power_law_1.01,0.03142400085926056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,128,balanced,0.06567466755708058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,128,power_law_1.01,2.8342079162597655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,128,power_law_1.01,0.03175039887428284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,128,power_law_1.2,0.09649279713630676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,128,power_law_1.01,0.033107200264930726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,128,power_law_1.2,0.10610560178756714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,128,power_law_1.01,6.114137649536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,128,balanced,0.07231999933719635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,128,power_law_1.01,0.033548799157142636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,128,power_law_1.2,0.0930176019668579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,128,power_law_1.01,0.03488639891147614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,128,balanced,0.697264035542806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,128,power_law_1.2,0.09215360283851623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,128,power_law_1.01,0.04299519956111908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,128,power_law_1.2,0.08625919818878174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,128,power_law_1.01,0.04859519898891449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,128,power_law_1.2,0.09186559915542603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,128,power_law_1.01,0.050220799446105954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,128,power_law_1.2,0.08295040130615235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,128,power_law_1.2,0.08266239762306213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,128,balanced,0.09109333157539368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,128,power_law_1.2,0.07311360239982605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,128,power_law_1.01,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,128,balanced,1.1738399664560955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,128,power_law_1.2,0.06151679754257202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,128,power_law_1.01,0.08018559813499451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,128,power_law_1.2,0.1239359974861145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,128,power_law_1.01,0.10337920188903808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,128,power_law_1.2,0.10428160429000854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,128,power_law_1.2,0.11879680156707764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,128,power_law_1.01,0.11591039896011353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,128,power_law_1.2,0.15786240100860596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,128,power_law_1.01,0.15260159969329834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,128,power_law_1.2,0.1922943949699402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,128,balanced,0.10800533493359883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,128,power_law_1.2,0.29395840167999265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,128,power_law_1.2,0.39580159187316893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,128,power_law_1.01,0.184934401512146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,128,power_law_1.2,0.4634431838989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,128,power_law_1.01,0.21728639602661132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,128,power_law_1.2,0.7302527904510498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,128,power_law_1.2,1.084928035736084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,128,power_law_1.01,0.31448960304260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,128,balanced,0.15236266454060873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,128,power_law_1.2,1.7235008239746095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,128,power_law_1.2,2.6964288711547852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,128,power_law_1.01,0.420959997177124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,128,power_law_1.2,3.312255859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,128,power_law_1.01,0.6470975875854492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,128,power_law_1.2,4.337433624267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,128,balanced,1.3527894020080566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,128,power_law_1.2,0.062489598989486694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,128,power_law_1.2,7.456806182861328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,128,power_law_1.01,0.8407103538513183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,128,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,128,balanced,0.18799465894699097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,128,power_law_1.2,0.06349440217018128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,128,power_law_1.2,16.050086975097656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,128,power_law_1.2,0.06670719981193543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,128,power_law_1.2,0.06595199704170226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,128,power_law_1.2,0.06732800006866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,128,power_law_1.2,0.06533759832382202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,128,power_law_1.01,1.1667200088500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,128,power_law_1.2,0.06235520243644714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,128,power_law_1.01,1.6268608093261718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,128,power_law_1.2,0.06028159856796265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,128,power_law_1.2,0.058963197469711306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,128,power_law_1.01,3.2444480895996093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,128,balanced,0.22781866788864136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,128,power_law_1.2,0.061427199840545656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,128,power_law_1.2,0.05699840188026428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,128,power_law_1.2,0.05608320236206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,128,power_law_1.2,0.060236799716949466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,128,power_law_1.2,0.08083199858665466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,128,power_law_1.2,0.07711359858512878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,128,power_law_1.2,0.08577280044555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,128,power_law_1.2,0.1185215950012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,128,power_law_1.2,0.15147520303726197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,128,power_law_1.2,0.18845440149307252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,128,power_law_1.2,0.25552639961242674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,128,balanced,0.34118934472401935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,128,power_law_1.2,0.38410239219665526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,128,power_law_1.2,0.5220992088317871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,128,power_law_1.2,0.756441593170166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,128,power_law_1.2,1.0359231948852539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,128,power_law_1.2,1.493945598602295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,128,power_law_1.2,1.9809215545654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,128,power_law_1.2,2.531500816345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,128,power_law_1.2,4.03702392578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,128,power_law_1.2,8.022406768798827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,128,power_law_1.2,0.0271807998418808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,128,balanced,0.6776106357574463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,128,power_law_1.2,0.02714880108833313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,64,balanced,0.03465066601832708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,128,power_law_1.2,0.027225598692893982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,64,balanced,0.0342399999499321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,128,power_law_1.2,0.029369598627090453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,64,balanced,0.03422400106986364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,128,power_law_1.2,0.0296640008687973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,64,balanced,0.03526933242877325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,128,power_law_1.2,0.030553600192070006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,64,balanced,0.03925866633653641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,128,power_law_1.2,0.03081600069999695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,64,balanced,0.036015999813874565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,128,power_law_1.2,0.0315200001001358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,64,balanced,0.04068266600370407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,128,power_law_1.2,0.03153280019760132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,64,balanced,0.03676266719897588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,64,balanced,0.03249066571394602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,128,power_law_1.2,0.03199360072612763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,64,balanced,0.03682133307059606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,128,power_law_1.2,0.03343360126018524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,64,balanced,0.03454400102297465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,64,balanced,0.03624533365170161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,64,balanced,0.04190400242805481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,128,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,64,balanced,0.0355679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,64,balanced,0.03885333240032196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,128,power_law_1.2,0.04359039962291718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,64,balanced,0.037445334096749626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,64,balanced,0.042165334026018776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,128,power_law_1.2,0.047091200947761536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,64,balanced,0.036981334288915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,64,balanced,0.042447999119758606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,128,power_law_1.2,0.05608959794044495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,64,balanced,0.03684266656637192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,64,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,128,power_law_1.2,0.06284800171852112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,64,balanced,0.036981334288915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,64,balanced,0.04563199977080027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,64,balanced,0.03721600025892258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,64,balanced,0.0473333348830541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,64,balanced,0.03800000001986822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,128,power_law_1.2,0.07848960161209106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,64,balanced,0.047269334395726524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,64,balanced,0.03860799968242645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,128,power_law_1.2,0.10522880554199218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,64,balanced,0.05107733110586802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,64,balanced,0.038405333956082664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,128,power_law_1.2,0.14067840576171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,64,balanced,0.05153599878152212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,64,balanced,0.039103999733924866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,64,balanced,0.04084266722202301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,64,balanced,0.06471999982992808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,128,power_law_1.2,0.173689603805542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,64,balanced,0.04308266441027323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,64,balanced,0.05904000004132589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,128,power_law_1.2,0.2194688081741333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,64,balanced,0.04283200204372406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,64,balanced,0.044768000642458596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,64,balanced,0.07336000104745229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,128,power_law_1.2,0.2448512077331543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,64,balanced,0.04839999973773956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,128,power_law_1.2,0.3315840005874634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,64,balanced,0.02664000044266383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,64,power_law_1.01,0.03717760145664215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,64,balanced,0.07157333195209503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,64,balanced,0.05354666709899902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,64,balanced,0.026554666459560394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,64,power_law_1.01,0.035846400260925296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,64,balanced,0.0672266681989034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,64,power_law_1.01,0.035417601466178894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,64,balanced,0.026693334182103474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,128,power_law_1.2,0.5041024208068847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,64,balanced,0.08962133526802063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,64,balanced,0.028138667345046997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,64,power_law_1.01,0.037254399061203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,64,balanced,0.070783997575442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,64,balanced,0.029637334247430164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,64,power_law_1.01,0.037964800000190736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,128,power_law_1.2,0.6734015941619873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,64,balanced,0.030789333085219067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,64,power_law_1.01,0.035769599676132205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,64,balanced,0.09011200070381165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,128,power_law_1.2,0.9830975532531738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,64,balanced,0.030666666726271313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,64,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,64,balanced,0.09601599971453349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,64,power_law_1.01,0.037324801087379456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,64,balanced,0.030762667457262676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,64,power_law_1.01,0.03607679903507233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,64,power_law_1.01,0.038252800703048706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,64,balanced,0.09983467062314351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,64,balanced,0.030853333572546642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,128,power_law_1.2,1.3592703819274903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,64,power_law_1.01,0.042534399032592776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,64,power_law_1.01,0.03785600066184998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,64,balanced,0.031530665854612984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,64,power_law_1.01,0.03583360016345978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,64,power_law_1.01,0.046758401393890384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,64,balanced,0.03198933353026708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,64,power_law_1.01,0.036396801471710205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,64,power_law_1.01,0.04999679923057556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,64,power_law_1.01,0.03641600012779236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,128,power_law_1.2,1.6770751953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,64,balanced,0.031871999303499855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,64,balanced,0.12949867049853006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,64,power_law_1.01,0.05162879824638367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,64,power_law_1.01,0.03650560081005096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,64,balanced,0.14079466462135315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,64,balanced,0.03284800052642822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,64,power_law_1.01,0.03709439933300018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,128,power_law_1.2,2.47825927734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,64,power_law_1.01,0.051692801713943484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,64,power_law_1.01,0.03740800023078918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,64,balanced,0.033333333830038704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,64,power_law_1.01,0.05082240104675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,64,power_law_1.01,0.037990400195121767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,128,power_law_1.2,5.1021888732910154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,64,balanced,0.03690666705369949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,64,power_law_1.01,0.03953920006752014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,64,power_law_1.01,0.053427201509475705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,64,balanced,0.1530133287111918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,64,power_law_1.01,0.041203200817108154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,64,power_law_1.01,0.05550720095634461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,64,balanced,0.036373332142829895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,64,power_law_1.01,0.04262399971485138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,64,power_law_1.01,0.06606720089912414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,64,power_law_1.01,0.044512000679969785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,64,power_law_1.01,0.04999040067195892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,64,power_law_1.01,0.07836800217628478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,64,power_law_1.01,0.05021439790725708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,64,balanced,0.15627732872962952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,64,power_law_1.01,0.09379199743270875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,64,power_law_1.01,0.05786240100860596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,64,power_law_1.01,0.11802879571914673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,64,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,64,balanced,0.037461332976818085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,64,power_law_1.01,0.08056319952011108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,64,balanced,0.21635200579961142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,64,power_law_1.01,0.11250560283660889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,64,balanced,0.040463998913764954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,64,power_law_1.01,0.1047551989555359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,64,power_law_1.01,0.135315203666687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,64,power_law_1.01,0.11221120357513428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,64,balanced,0.04170133173465729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,64,power_law_1.01,0.16153600215911865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,64,power_law_1.01,0.14097919464111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,64,power_law_1.01,0.15066239833831788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,64,power_law_1.01,0.20487680435180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,64,power_law_1.01,0.23671040534973145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,64,power_law_1.01,0.2777535915374756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,64,power_law_1.01,0.2842623949050903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,64,power_law_1.01,0.3479552030563354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,64,power_law_1.01,0.4124608039855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,64,balanced,0.17692800362904867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,64,power_law_1.01,0.5531263828277588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,64,power_law_1.01,0.4933631896972656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,64,balanced,0.05003199974695841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,64,balanced,0.2635306715965271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,64,power_law_1.01,0.6099391937255859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,64,power_law_1.01,0.6161920070648194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,64,power_law_1.01,1.0860159873962403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,64,balanced,0.05690133571624756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,64,power_law_1.01,1.0142527580261231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,64,power_law_1.01,0.02733440101146698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,64,power_law_1.01,2.0967744827270507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,64,power_law_1.01,0.026924800872802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,64,power_law_1.01,2.0402559280395507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,64,power_law_1.01,0.026815998554229736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,64,power_law_1.01,0.028774398565292358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,64,balanced,0.06994133194287618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,64,power_law_1.01,0.02975359857082367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,64,power_law_1.01,0.030611199140548707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,64,balanced,0.07821333408355713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,64,power_law_1.01,0.030937600135803222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,64,balanced,0.3124319911003113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,64,power_law_1.01,0.03078399896621704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,64,power_law_1.01,0.031123200058937074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,64,balanced,0.2577386697133382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,64,power_law_1.01,0.031564798951148984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,64,power_law_1.01,0.03369599878787995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,64,power_law_1.01,0.035411199927330016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,64,balanced,0.1029813289642334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,64,power_law_1.01,0.036339199542999266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,64,power_law_1.2,0.038252800703048706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,64,power_law_1.01,0.03904640078544617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,64,power_law_1.2,0.033344000577926636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,64,power_law_1.01,0.045337599515914914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,64,power_law_1.2,0.03470079898834229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,64,power_law_1.01,0.05122560262680054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,64,power_law_1.2,0.03653120100498199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,64,power_law_1.2,0.036883199214935304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,64,power_law_1.01,0.05925760269165039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,64,power_law_1.2,0.034195199608802795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,64,balanced,0.12275733550389607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,64,balanced,0.47870934009552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,64,power_law_1.01,0.07058560252189636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,64,power_law_1.2,0.04102399945259094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,64,power_law_1.01,0.08143360018730164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,64,power_law_1.2,0.04447999894618988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,64,power_law_1.2,0.044038400053977966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,64,power_law_1.2,0.049369600415229795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,64,power_law_1.01,0.09896960258483886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,64,power_law_1.2,0.05061759948730469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,64,power_law_1.01,0.14642560482025146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,64,balanced,0.17400532960891724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,64,power_law_1.2,0.0516543984413147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,64,power_law_1.01,0.16524159908294678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,64,power_law_1.2,0.052774399518966675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,64,power_law_1.2,0.049747198820114136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,64,power_law_1.01,0.20017919540405274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,64,power_law_1.2,0.057529598474502563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,64,power_law_1.2,0.06238719820976257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,64,power_law_1.01,0.2682751893997192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,64,power_law_1.2,0.06903679966926575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,64,balanced,0.2180053393046061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,64,power_law_1.2,0.10039680004119873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,64,power_law_1.01,0.3840320110321045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,64,power_law_1.2,0.1086400032043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,64,power_law_1.01,0.6407872200012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,64,balanced,0.46328532695770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,64,power_law_1.2,0.15843199491500853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,64,power_law_1.2,0.13980159759521485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,64,power_law_1.01,0.7682816028594971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,64,power_law_1.2,0.18338559865951537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,64,power_law_1.2,0.24883840084075928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,64,power_law_1.2,0.3424639940261841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,64,power_law_1.01,0.896339225769043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,64,power_law_1.2,0.45012478828430175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,64,power_law_1.01,1.5836480140686036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,64,power_law_1.2,0.6337344169616699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,64,balanced,0.26629867156346637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,64,power_law_1.2,0.7929024219512939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,64,power_law_1.01,2.960659217834473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,64,power_law_1.2,1.0003328323364258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,64,balanced,0.9131200313568115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,64,power_law_1.2,1.685638427734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,64,power_law_1.2,4.344153594970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,64,balanced,0.426693320274353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,64,power_law_1.2,0.03680639863014221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,64,power_law_1.2,0.03544319868087768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,64,power_law_1.2,0.03648639917373657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,64,power_law_1.2,0.035846400260925296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,64,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,64,power_law_1.2,0.036313599348068236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,64,power_law_1.2,0.036364799737930296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,64,power_law_1.2,0.03726719915866852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,64,power_law_1.2,0.03759360015392303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,64,power_law_1.2,0.03837440013885498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,64,power_law_1.2,0.041631999611854556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,64,power_law_1.2,0.04211840033531189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,64,power_law_1.2,0.04361599981784821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,64,power_law_1.2,0.0455808013677597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,64,power_law_1.2,0.05141760110855102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,32,balanced,0.03336533407370249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,64,power_law_1.2,0.05316479802131653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,32,balanced,0.03312533348798752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,64,balanced,0.8269333044687907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,64,power_law_1.2,0.06362879872322083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,32,balanced,0.030213333666324615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,64,power_law_1.2,0.08042240142822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,32,balanced,0.03147733211517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,64,power_law_1.2,0.08909440040588379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,64,power_law_1.2,0.027270400524139406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,32,balanced,0.0377866675456365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,32,balanced,0.039290666580200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,64,power_law_1.2,0.13200639486312865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,64,power_law_1.2,0.026438400149345398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,64,power_law_1.2,0.027251198887825012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,32,balanced,0.03939199944337209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,64,power_law_1.2,0.13141759634017944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,64,power_law_1.2,0.02874239981174469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,32,balanced,0.04022933294375738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,64,power_law_1.2,0.02961280047893524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,64,power_law_1.2,0.18205440044403076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,64,power_law_1.2,0.030726400017738343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,32,balanced,0.03979199876387914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,64,power_law_1.2,0.20049281120300294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,64,power_law_1.2,0.030707201361656188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,32,balanced,0.03987200061480204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,64,power_law_1.2,0.030943998694419862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,64,power_law_1.2,0.31585280895233153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,64,power_law_1.2,0.031327998638153075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,32,balanced,0.04058666775623957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,64,power_law_1.2,0.03218559920787811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,64,power_law_1.2,0.3636543989181519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,32,balanced,0.0415040006240209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,64,power_law_1.2,0.03475840091705322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,64,power_law_1.2,0.5958720207214355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,32,balanced,0.04318933188915253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,64,power_law_1.2,0.03637759983539581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,64,power_law_1.2,0.03865599930286408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,32,balanced,0.04301866888999939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,64,power_law_1.2,0.7260543823242187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,64,power_law_1.2,0.040300801396369934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,32,balanced,0.046495998899141945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,64,power_law_1.2,0.04958719909191132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,64,power_law_1.2,0.9131967544555664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,64,power_law_1.2,0.05682560205459595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,32,balanced,0.04689066608746847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,64,power_law_1.2,1.9224767684936523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,32,balanced,0.048656001687049866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,64,power_law_1.2,0.06716160178184509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,64,power_law_1.2,2.9941503524780275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,64,power_law_1.2,0.0904640018939972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,32,balanced,0.05118933320045471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,64,power_law_1.2,0.10602240562438965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,32,balanced,0.052906667192777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,32,balanced,0.06541333099206288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,64,power_law_1.2,0.13619199991226197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,64,power_law_1.2,0.1919808030128479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,32,balanced,0.06211199859778086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,64,power_law_1.2,0.24506878852844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,64,power_law_1.2,0.33685119152069093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,32,balanced,0.07642666498819987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,64,power_law_1.2,0.4893951892852783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,32,balanced,0.07542400062084198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,64,power_law_1.2,0.5236608028411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,64,power_law_1.2,0.908563232421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,32,balanced,0.0997173289457957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,64,power_law_1.2,1.6960639953613281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,64,power_law_1.2,2.0056640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,64,power_law_1.2,2.968601608276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,32,balanced,0.032629333436489105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,32,balanced,0.1067626674969991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,32,balanced,0.0317493329445521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,64,power_law_1.2,6.523123168945313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,32,balanced,0.03182400017976761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,32,balanced,0.03472533325354258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,32,balanced,0.03813866774241129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,32,balanced,0.03689600030581156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,32,balanced,0.03696000079313914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,32,balanced,0.15839999914169312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,32,balanced,0.03728000074625015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,32,balanced,0.03721600025892258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,32,balanced,0.03793599953254064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,32,balanced,0.03833066672086716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,32,balanced,0.038362666964530945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,32,power_law_1.01,0.03518719971179962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,32,power_law_1.01,0.042284798622131345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,32,balanced,0.039247999588648476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,32,power_law_1.01,0.03559040129184723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,32,balanced,0.18156800667444864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,32,power_law_1.01,0.035104000568389894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,32,balanced,0.04037333279848099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,32,power_law_1.01,0.031411200761795044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,32,power_law_1.01,0.0324288010597229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,32,balanced,0.042821332812309265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,32,power_law_1.01,0.03547520041465759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,32,power_law_1.01,0.03412480056285858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,32,balanced,0.04275199770927429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,32,power_law_1.01,0.038649600744247434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,32,power_law_1.01,0.03551360070705414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,32,power_law_1.01,0.039027199149131775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,32,balanced,0.045184001326560974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,32,balanced,0.02643200010061264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,32,power_law_1.01,0.0361407995223999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,32,power_law_1.01,0.03871999979019165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,32,balanced,0.026608000199000042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,32,balanced,0.04860800007979075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,32,power_law_1.01,0.03625600039958954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,32,power_law_1.01,0.04068480134010315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,32,balanced,0.02682666728893916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,32,balanced,0.053216000398000084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,32,power_law_1.01,0.03705599904060364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,32,power_law_1.01,0.04926080107688904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,32,balanced,0.028698667883872986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,32,balanced,0.21059733629226685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,32,power_law_1.01,0.037510401010513304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,32,power_law_1.01,0.04967679977416992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,32,balanced,0.06898133456707001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,32,balanced,0.03012266755104065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,32,power_law_1.01,0.03815680146217346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,32,power_law_1.01,0.05070080161094666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,32,balanced,0.030938667555650074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,32,power_law_1.01,0.03930880129337311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,32,balanced,0.07367999851703644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,32,balanced,0.031210665901501972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,32,power_law_1.01,0.053395199775695804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,32,power_law_1.01,0.040908798575401306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,32,balanced,0.031210665901501972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,32,power_law_1.01,0.05560320019721985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,32,power_law_1.01,0.041817599534988405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,32,balanced,0.09407466650009155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,32,balanced,0.03143999973932902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,32,power_law_1.01,0.048844799399375916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,32,power_law_1.01,0.04216960072517395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,32,balanced,0.03176533430814743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,32,power_law_1.01,0.053907197713851926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,32,power_law_1.01,0.0486847996711731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,32,balanced,0.03221333275238673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,32,balanced,0.10226133465766907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,32,power_law_1.01,0.04829440116882324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,32,power_law_1.01,0.05555199980735779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,32,balanced,0.03306133300065994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,32,power_law_1.01,0.054028797149658206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,32,power_law_1.01,0.055212801694869994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,32,balanced,0.03372266640265783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,32,power_law_1.01,0.0656000018119812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,32,power_law_1.01,0.06912639737129211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,32,balanced,0.03417066733042399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,32,balanced,0.13928533593813577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,32,power_law_1.01,0.0772607982158661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,32,power_law_1.01,0.0802623987197876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,32,power_law_1.01,0.09201279878616334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,32,power_law_1.01,0.09464960098266602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,32,power_law_1.01,0.1068992018699646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,32,balanced,0.31435199578603107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,32,balanced,0.039034667114416756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,32,power_law_1.01,0.10268800258636475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,32,power_law_1.01,0.12997759580612184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,32,balanced,0.03822399924198786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,32,balanced,0.16394133369127908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,32,power_law_1.01,0.12817920446395875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,32,power_law_1.01,0.18007680177688598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,32,power_law_1.01,0.17118079662323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,32,power_law_1.01,0.2136512041091919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,32,power_law_1.01,0.26232960224151614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,32,power_law_1.01,0.20563199520111083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,32,power_law_1.01,0.38962559700012206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,32,power_law_1.01,0.23583359718322755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,32,balanced,0.03977599988381068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,32,power_law_1.01,0.5130239963531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,32,power_law_1.01,0.31288321018218995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,32,balanced,0.23448532819747925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,32,balanced,0.044154668847719826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,32,power_law_1.01,0.5942848205566407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,32,power_law_1.01,0.43697919845581057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,32,power_law_1.01,1.1204480171203612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,32,balanced,0.04757333298524221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,32,power_law_1.01,0.5643136024475097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,32,power_law_1.01,1.9267135620117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,32,power_law_1.01,0.8376959800720215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,32,power_law_1.01,1.6275455474853515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,32,balanced,0.05694933235645294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,32,power_law_1.01,0.028595200181007384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,32,power_law_1.01,0.027065598964691163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,32,balanced,0.2932693362236023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,32,balanced,0.06516266862551372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,32,power_law_1.01,0.02687999904155731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,32,power_law_1.01,0.029395198822021483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,32,power_law_1.01,0.02975359857082367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,32,power_law_1.01,0.030950400233268737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,32,balanced,0.08260266482830048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,32,power_law_1.01,0.031116798520088196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,32,power_law_1.01,0.03146879971027374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,32,power_law_1.01,0.03373439908027649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,32,balanced,0.09410132964452107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,32,power_law_1.01,0.03342080116271973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,32,balanced,0.3511360088984172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,32,power_law_1.01,0.03615359961986542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,32,balanced,0.5666613181432089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,32,power_law_1.01,0.037215998768806456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,32,power_law_1.01,0.03956480026245117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,32,power_law_1.2,0.037190398573875426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,32,power_law_1.01,0.041875201463699344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,32,power_law_1.2,0.03416320085525513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,32,balanced,0.12706666191418967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,32,power_law_1.2,0.03229439854621887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,32,power_law_1.01,0.0448063999414444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,32,power_law_1.2,0.0353408008813858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,32,power_law_1.01,0.04999679923057556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,32,power_law_1.2,0.03948160111904144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,32,power_law_1.2,0.039801600575447085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,32,power_law_1.01,0.057574397325515746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,32,power_law_1.2,0.03856000006198883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,32,power_law_1.01,0.07239680290222168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,32,power_law_1.2,0.04715520143508911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,32,power_law_1.01,0.08515840172767639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,32,balanced,0.15562666455904642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,32,power_law_1.2,0.04864639937877655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,32,power_law_1.2,0.050246399641036985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,32,power_law_1.01,0.0987712025642395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,32,power_law_1.2,0.051660799980163576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,32,power_law_1.01,0.12910079956054688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,32,balanced,0.5362399816513062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,32,power_law_1.2,0.05389440059661865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,32,power_law_1.01,0.17146240472793578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,32,power_law_1.2,0.05606399774551392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,32,power_law_1.2,0.052767997980117796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,32,power_law_1.01,0.22801918983459474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,32,balanced,0.23185600837071738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,32,power_law_1.2,0.05506560206413269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,32,power_law_1.01,0.32690560817718506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,32,power_law_1.2,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,32,power_law_1.2,0.0686847984790802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,32,power_law_1.01,0.3835200071334839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,32,power_law_1.2,0.07909119725227357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,32,power_law_1.2,0.04186240136623383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,32,power_law_1.01,0.6013184070587159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,32,power_law_1.2,0.09268479943275451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,32,power_law_1.2,0.03374080061912536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,32,power_law_1.2,0.12100479602813721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,32,power_law_1.01,0.79683837890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,32,power_law_1.2,0.03346560001373291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,32,power_law_1.2,0.11898880004882813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,32,power_law_1.01,0.9190848350524903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,32,balanced,0.3064799904823303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,32,power_law_1.2,0.035724800825119016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,32,power_law_1.2,0.15111039876937865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,32,power_law_1.01,1.6325824737548829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,32,power_law_1.2,0.03622399866580963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,32,power_law_1.2,0.19508479833602904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,32,power_law_1.2,0.036294400691986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,32,power_law_1.01,3.1804479598999023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,32,power_law_1.2,0.310099196434021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,32,power_law_1.2,0.036364799737930296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,32,power_law_1.2,0.33503360748291017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,32,power_law_1.2,0.03759360015392303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,32,power_law_1.2,0.4978176116943359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,32,power_law_1.2,0.03815680146217346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,32,power_law_1.2,0.5613120079040528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,32,power_law_1.2,0.038624000549316403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,32,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,32,power_law_1.2,1.063596820831299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,32,balanced,0.3753173351287842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,32,power_law_1.2,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,32,power_law_1.2,2.2037567138671874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,32,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,32,power_law_1.2,3.2604606628417967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,32,power_law_1.2,0.044486400485038755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,32,power_law_1.2,0.04961279928684235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,32,power_law_1.2,0.050732797384262084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,32,balanced,1.0251359939575195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,32,power_law_1.2,0.058956801891326904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,32,power_law_1.2,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,32,power_law_1.2,0.07747840285301208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,32,power_law_1.2,0.10385279655456543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,32,power_law_1.2,0.1148800015449524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,32,power_law_1.2,0.17250560522079467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,32,balanced,0.5772480169932047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,32,power_law_1.2,0.18305920362472533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,32,power_law_1.2,0.30037760734558105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,32,power_law_1.2,0.3442944049835205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,32,power_law_1.2,0.5401088237762451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,32,power_law_1.2,0.7322944164276123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,32,power_law_1.2,0.9789952278137207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,32,power_law_1.2,1.373459243774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,32,power_law_1.2,2.9185728073120116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,16,balanced,0.033573334415753685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,16,balanced,0.02924799919128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,16,balanced,0.029477333029111225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,32,power_law_1.2,0.028755199909210206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,16,balanced,0.03176533430814743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,32,power_law_1.2,0.027039998769760133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,16,balanced,0.036746665835380554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,32,power_law_1.2,0.026969599723815917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,16,balanced,0.037685332198937736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,32,power_law_1.2,0.029216000437736513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,32,balanced,1.122106631596883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,16,balanced,0.03910933434963226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,16,balanced,0.03677866607904434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,32,power_law_1.2,0.029657599329948426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,16,balanced,0.03682666768630346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,32,power_law_1.2,0.031116798520088196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,16,balanced,0.03994666785001755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,32,power_law_1.2,0.03134720027446747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,16,balanced,0.03886933376391729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,32,power_law_1.2,0.033190399408340454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,16,balanced,0.038693333665529885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,32,power_law_1.2,0.03383679986000061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,16,balanced,0.03940266619126002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,32,power_law_1.2,0.03400320112705231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,16,balanced,0.03198933353026708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,16,balanced,0.04872000217437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,32,power_law_1.2,0.03615359961986542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,16,balanced,0.032069332897663116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,32,power_law_1.2,0.03991039991378784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,16,balanced,0.04696533580621084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,16,balanced,0.03274133304754893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,32,power_law_1.2,0.040915200114250184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,16,balanced,0.04828799764315287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,16,balanced,0.035317334036032356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,32,power_law_1.2,0.043705600500106814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,16,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,16,balanced,0.039893334110577904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,16,balanced,0.05508266886075338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,16,balanced,0.03915733347336451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,32,power_law_1.2,0.0474047988653183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,16,balanced,0.039503999054431915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,16,balanced,0.05579199890295664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,32,power_law_1.2,0.04989440143108368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,16,balanced,0.039520000418027244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,16,balanced,0.0692799985408783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,16,balanced,0.039333333571751915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,32,power_law_1.2,0.06339200139045716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,16,balanced,0.04030933231115341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,16,balanced,0.06905599931875865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,16,balanced,0.04084266722202301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,32,power_law_1.2,0.07763199806213379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,16,balanced,0.041002665956815086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,32,power_law_1.2,0.09665279984474182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,16,balanced,0.08644266923268636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,16,balanced,0.041989331444104515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,32,power_law_1.2,0.12431360483169555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,16,balanced,0.043807998299598694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,32,power_law_1.2,0.13982080221176146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,16,balanced,0.04516266783078512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,16,balanced,0.08539199829101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,16,balanced,0.04513599971930186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,32,power_law_1.2,0.22013440132141113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,16,balanced,0.04740266501903534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,32,power_law_1.2,0.32140800952911375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,16,balanced,0.11679466565450032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,16,balanced,0.05163733164469401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,32,power_law_1.2,0.47496957778930665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,16,balanced,0.05700799822807312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,32,power_law_1.2,0.6451968193054199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,16,balanced,0.073253333568573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,32,power_law_1.2,1.030790424346924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,16,balanced,0.1341333289941152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,16,balanced,0.08171733220418294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,32,power_law_1.2,1.3353407859802247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,16,balanced,0.026677332818508148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,32,power_law_1.2,1.7962944030761718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,16,balanced,0.10391466816266377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,16,balanced,0.02678400029738744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,32,power_law_1.2,2.782899284362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,16,balanced,0.027471999327341717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,16,balanced,0.029445332785447437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,16,balanced,0.032069332897663116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,32,power_law_1.2,5.233561706542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,16,balanced,0.11432533462842305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,16,balanced,0.20018666982650757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,16,balanced,0.033039999504884086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,16,balanced,0.03322133421897888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,16,balanced,0.033376000821590424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,16,balanced,0.03387733300526937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,16,balanced,0.034490667283535004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,16,balanced,0.15980266531308493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,16,balanced,0.03483733286460241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,16,balanced,0.03611200054486593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,16,balanced,0.03686933219432831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,16,balanced,0.03738666574160258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,16,balanced,0.23322133223215738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,16,balanced,0.1930613319079081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,16,power_law_1.01,0.04439679980278015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,16,power_law_1.01,0.04131839871406555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,16,balanced,0.042863999803860985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,16,balanced,0.042303999265034996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,16,power_law_1.01,0.03173120021820068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,16,power_law_1.01,0.03581439852714539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,16,power_law_1.01,0.030873599648475646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,16,power_law_1.01,0.03247359991073608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,16,power_law_1.01,0.03495039939880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,16,power_law_1.01,0.03898879885673523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,16,power_law_1.01,0.03805440068244934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,16,power_law_1.01,0.03473280072212219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,16,balanced,0.045552000403404236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,16,power_law_1.01,0.038361600041389464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,16,balanced,0.2822879950205485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,16,power_law_1.01,0.03711360096931458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,16,balanced,0.05230399966239929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,16,power_law_1.01,0.03818880021572113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,16,power_law_1.01,0.03557760119438171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,16,power_law_1.01,0.03898879885673523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,16,balanced,0.05710933109124502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,16,power_law_1.01,0.037785598635673524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,16,balanced,0.2836586634318034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,16,power_law_1.01,0.03930880129337311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,16,power_law_1.01,0.040479999780654904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,16,power_law_1.01,0.04079360067844391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,16,power_law_1.01,0.0458624005317688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,16,balanced,0.07254933317502339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,16,power_law_1.01,0.04221439957618713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,16,power_law_1.01,0.0468095988035202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,16,power_law_1.01,0.04320000112056732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,16,balanced,0.08225599924723308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,16,power_law_1.01,0.05041279792785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,16,power_law_1.01,0.04563199877738953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,16,balanced,0.35944000879923504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,16,power_law_1.01,0.050367999076843264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,16,power_law_1.01,0.044972801208496095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,16,power_law_1.01,0.04950399994850159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,16,power_law_1.01,0.04910080134868622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,16,power_law_1.01,0.051475197076797485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,16,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,16,balanced,0.10823466380437215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,16,power_law_1.01,0.03331199884414673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,16,power_law_1.01,0.05607680082321167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,16,power_law_1.01,0.057120001316070555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,16,power_law_1.01,0.07023360133171082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,16,power_law_1.01,0.028249600529670717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,16,power_law_1.01,0.06395519971847534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,16,balanced,0.12642666697502136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,16,power_law_1.01,0.07523840069770812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,16,power_law_1.01,0.028147199749946596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,16,power_law_1.01,0.07729920148849487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,16,power_law_1.01,0.09665279984474182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,16,power_law_1.01,0.030707201361656188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,16,power_law_1.01,0.07720320224761963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,16,power_law_1.01,0.11028480529785156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,16,power_law_1.01,0.03158400058746338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,16,balanced,0.43348264694213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,16,power_law_1.01,0.09290239810943604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,16,balanced,0.4151839812596639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,16,power_law_1.01,0.14588160514831544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,16,power_law_1.01,0.03320319950580597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,16,power_law_1.01,0.1034432053565979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,16,power_law_1.01,0.15790719985961915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,16,power_law_1.01,0.034176000952720643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,16,balanced,0.18251200517018637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,16,power_law_1.01,0.12268799543380737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,16,power_law_1.01,0.03489919900894165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,16,power_law_1.01,0.22513279914855958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,16,power_law_1.01,0.14323840141296387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,16,power_law_1.01,0.03470079898834229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,16,power_law_1.01,0.2914560079574585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,16,power_law_1.01,0.19783040285110473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,16,power_law_1.01,0.036774399876594546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,16,power_law_1.01,0.4192768096923828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,16,power_law_1.01,0.236678409576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,16,power_law_1.01,0.038099199533462524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,16,power_law_1.01,0.33562240600585935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,16,power_law_1.01,0.04134399890899658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,16,power_law_1.01,0.5631487846374512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,16,power_law_1.01,0.04397439956665039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,16,power_law_1.01,0.42427520751953124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,16,power_law_1.01,0.7403200149536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,16,balanced,0.24587732553482056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,16,power_law_1.01,0.048492801189422605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,16,power_law_1.01,0.5746560096740723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,16,power_law_1.01,1.1026880264282226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,16,power_law_1.01,0.05128960013389587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,16,power_law_1.01,0.9193471908569336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,16,power_law_1.01,2.2299327850341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,16,power_law_1.01,0.05482879877090454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,16,power_law_1.01,1.6891263961791991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,16,balanced,0.6532479921976725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,16,balanced,0.35814932982126874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,16,power_law_1.01,0.06389120221138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,16,power_law_1.2,0.04239999949932098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,16,power_law_1.01,0.08051199913024902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,16,power_law_1.2,0.029478400945663452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,16,power_law_1.01,0.0883072018623352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,16,power_law_1.2,0.03159680068492889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,16,power_law_1.2,0.0398144006729126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,16,power_law_1.01,0.11829760074615478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,16,power_law_1.01,0.1353279948234558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,16,power_law_1.2,0.035308799147605895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,16,balanced,0.4607786734898885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,16,power_law_1.2,0.03694080114364624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,16,power_law_1.01,0.1854591965675354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,16,power_law_1.2,0.0377344012260437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,16,power_law_1.01,0.2679231882095337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,16,power_law_1.2,0.039776000380516055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,16,power_law_1.01,0.33775360584259034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,16,power_law_1.2,0.04344959855079651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,16,power_law_1.2,0.047731199860572816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,16,balanced,0.7998826503753662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,16,power_law_1.2,0.04880639910697937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,16,power_law_1.01,0.4743167877197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,16,power_law_1.2,0.05182719826698303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,16,power_law_1.01,0.7158336162567138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,16,balanced,0.5641119877497355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,16,power_law_1.2,0.051667201519012454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,16,power_law_1.01,1.103756809234619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,16,power_law_1.2,0.04965119957923889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,16,power_law_1.01,1.1106623649597167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,16,power_law_1.2,0.05383679866790771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,16,power_law_1.01,1.6947263717651366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,16,power_law_1.2,0.05726720094680786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,16,power_law_1.2,0.06262400150299072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,16,power_law_1.01,3.268339157104492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,16,power_law_1.2,0.07772799730300903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,16,power_law_1.2,0.08191360235214233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,16,power_law_1.2,0.10181119441986083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,16,balanced,1.270896037419637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,16,power_law_1.2,0.12239359617233277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,16,power_law_1.2,0.15419520139694215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,16,balanced,0.8819413185119629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,16,power_law_1.2,0.16019200086593627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,16,power_law_1.2,0.20901761054992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,16,power_law_1.2,0.04255360066890716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,16,power_law_1.2,0.26150400638580323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,16,power_law_1.2,0.032927998900413515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,16,power_law_1.2,0.42891521453857423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,16,power_law_1.2,0.033011201024055484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,16,power_law_1.2,0.6257855892181396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,16,power_law_1.2,0.035776001214981076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,16,power_law_1.2,0.648742389678955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,16,power_law_1.2,0.03717760145664215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,16,power_law_1.2,1.3209152221679688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,16,power_law_1.2,0.038073599338531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,16,power_law_1.2,0.03873920142650604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,16,power_law_1.2,2.694668769836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,16,power_law_1.2,0.0400191992521286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,16,power_law_1.2,0.03999359905719757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,16,power_law_1.2,0.0409855991601944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,16,power_law_1.2,0.043699198961257936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,16,power_law_1.2,0.04411520063877106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,16,power_law_1.2,0.04709759950637817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,16,power_law_1.2,0.04588159918785095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,16,power_law_1.2,0.05183359980583191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,16,power_law_1.2,0.05223039984703064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,16,power_law_1.2,0.05999360084533691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,16,balanced,1.7304479281107585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,16,power_law_1.2,0.07568640112876893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,16,power_law_1.2,0.08157439827919007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,16,power_law_1.2,0.10727039575576783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,16,power_law_1.2,0.11891839504241944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,16,power_law_1.2,0.14762239456176757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,16,power_law_1.2,0.19274239540100097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,16,power_law_1.2,0.2789184093475342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,16,power_law_1.2,0.33591039180755616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,16,power_law_1.2,0.4985983848571777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,16,power_law_1.2,0.7479104042053223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,16,power_law_1.2,1.1220671653747558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,16,power_law_1.2,1.7014591217041015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,16,power_law_1.2,2.9465215682983397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,8,balanced,0.03531199942032496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,8,balanced,0.03365333378314972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,16,power_law_1.2,0.03298560082912445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,8,balanced,0.034501334031422935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,16,power_law_1.2,0.02800639867782593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,8,balanced,0.041722665230433144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,16,power_law_1.2,0.02791680097579956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,8,balanced,0.04137066751718521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,16,power_law_1.2,0.030803200602531434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,8,balanced,0.04229333500067393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,8,balanced,0.04246933261553446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,16,power_law_1.2,0.03192319869995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,8,balanced,0.04350399971008301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,16,power_law_1.2,0.03333759903907776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,8,balanced,0.043285335103670754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,16,power_law_1.2,0.034272000193595886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,8,balanced,0.043162668744723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,8,balanced,0.044218664367993675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,16,power_law_1.2,0.036160001158714296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,8,balanced,0.04677866895993551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,16,power_law_1.2,0.03658879995346069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,8,balanced,0.04728533327579498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,8,balanced,0.032272001107533775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,16,power_law_1.2,0.03709439933300018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,8,balanced,0.04837333162625631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,8,balanced,0.03268266717592875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,16,power_law_1.2,0.03943040072917938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,8,balanced,0.05212266743183136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,8,balanced,0.03316266586383184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,16,power_law_1.2,0.041555199027061465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,8,balanced,0.052704001466433205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,8,balanced,0.03584533433119456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,16,power_law_1.2,0.045075199007987975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,8,balanced,0.03974399964014689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,8,balanced,0.05773333211739858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,16,power_law_1.2,0.04837760031223297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,8,balanced,0.04085866610209147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,8,balanced,0.06460266808668773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,8,balanced,0.04116799930731455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,16,power_law_1.2,0.05485439896583557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,8,balanced,0.04123199979464213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,8,balanced,0.06645866731802623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,16,power_law_1.2,0.05454720258712768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,8,balanced,0.04144533226887385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,8,balanced,0.04200000067551931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,8,balanced,0.07434666653474171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,8,balanced,0.042447999119758606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,16,power_law_1.2,0.0648639976978302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,8,balanced,0.04262933135032654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,8,balanced,0.07975466549396515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,8,balanced,0.043791999419530235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,16,power_law_1.2,0.08524159789085388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,8,balanced,0.044677332043647766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,16,power_law_1.2,0.09722880125045777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,8,balanced,0.10063999891281128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,8,balanced,0.04947733382383982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,8,balanced,0.04971733192602793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,16,power_law_1.2,0.12318079471588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,8,power_law_1.01,0.038387200236320494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,8,balanced,0.052986666560173035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,8,balanced,0.11213866869608562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,16,power_law_1.2,0.16286079883575438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,8,power_law_1.01,0.036723199486732486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,8,balanced,0.06004266440868378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,8,power_law_1.01,0.036748799681663516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,8,balanced,0.0680266668399175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,16,power_law_1.2,0.24350719451904296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,8,power_law_1.01,0.04195840060710907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,8,balanced,0.16273599863052368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,16,power_law_1.2,0.30741760730743406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,8,power_law_1.01,0.040934398770332336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,8,balanced,0.08050133287906647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,8,power_law_1.01,0.04460160136222839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,8,power_law_1.01,0.04408319890499115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,8,balanced,0.09128000338872273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,16,power_law_1.2,0.46094717979431155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,8,power_law_1.01,0.04525440037250519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,8,power_law_1.01,0.04459519982337952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,8,balanced,0.20037867625554404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,16,power_law_1.2,0.6815040111541748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,8,balanced,0.12337600191434224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,8,power_law_1.01,0.04529919922351837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,16,power_law_1.2,0.9760319709777832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,8,power_law_1.01,0.04880000054836273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,8,power_law_1.01,0.05116159915924072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,16,power_law_1.2,1.3442496299743651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,8,balanced,0.14054399728775024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,8,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,16,power_law_1.2,1.7410367965698241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,8,power_law_1.01,0.05618559718132019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,8,power_law_1.01,0.03504000008106232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,8,power_law_1.01,0.06042879819869995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,16,power_law_1.2,2.9680896759033204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,8,balanced,0.29155200719833374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,8,balanced,0.2037013371785482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,8,power_law_1.01,0.03270399868488312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,8,power_law_1.01,0.061977601051330565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,8,power_law_1.01,0.033228799700737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,8,power_law_1.01,0.06524800062179566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,16,power_law_1.2,8.620262145996094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,8,power_law_1.01,0.036108800768852235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,8,power_law_1.01,0.0754047989845276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,8,power_law_1.01,0.03687039911746979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,8,power_law_1.01,0.08144000172615051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,8,balanced,0.259168008963267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,8,power_law_1.01,0.04043520092964172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,8,power_law_1.01,0.09900799989700318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,8,power_law_1.01,0.04103679955005646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,8,power_law_1.01,0.10234240293502808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,8,power_law_1.01,0.0412416011095047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,8,power_law_1.01,0.1561344027519226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,8,balanced,0.38255465030670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,8,power_law_1.01,0.04257920086383819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,8,power_law_1.01,0.16600960493087769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,8,power_law_1.01,0.042931199073791504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,8,power_law_1.01,0.22544639110565184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,8,balanced,0.3806026776631673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,8,power_law_1.01,0.04609920084476471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,8,power_law_1.01,0.2797760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,8,power_law_1.01,0.047040000557899475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,8,power_law_1.01,0.4104640007019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,8,power_law_1.01,0.050419199466705325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,8,power_law_1.01,0.5484416007995605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,8,power_law_1.01,0.050432002544403075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,8,power_law_1.01,0.7398399829864502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,8,power_law_1.01,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,8,power_law_1.01,1.0367039680480956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,8,power_law_1.01,0.058432000875473025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,8,power_law_1.01,0.06355839967727661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,8,balanced,0.4764053424199422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,8,balanced,0.4607679843902588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,8,power_law_1.01,2.3070335388183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,8,power_law_1.01,0.0710591971874237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,8,power_law_1.01,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,8,power_law_1.01,0.10759040117263793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,8,power_law_1.01,0.12314239740371705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,8,power_law_1.2,0.03831680119037628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,8,power_law_1.01,0.16331520080566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,8,power_law_1.2,0.03472639918327332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,8,power_law_1.2,0.03641600012779236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,8,power_law_1.01,0.19545600414276124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,8,power_law_1.2,0.040217599272727965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,8,power_law_1.2,0.038227200508117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,8,power_law_1.01,0.2809279918670654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,8,power_law_1.2,0.04449920058250427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,8,balanced,0.5907573302586874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,8,power_law_1.2,0.044223999977111815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,8,power_law_1.01,0.3295680046081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,8,power_law_1.2,0.045510399341583255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,8,power_law_1.2,0.04624640047550201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,8,power_law_1.01,0.5489855766296386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,8,power_law_1.2,0.046758401393890384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,8,power_law_1.01,0.6402751922607421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,8,power_law_1.2,0.05076479911804199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,8,power_law_1.01,0.9149439811706543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,8,power_law_1.2,0.051507198810577394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,8,balanced,0.6522719860076904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,8,power_law_1.2,0.05232639908790589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,8,power_law_1.01,1.2727487564086915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,8,power_law_1.2,0.055871999263763426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,8,power_law_1.2,0.060236799716949466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,8,power_law_1.01,2.585260772705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,8,power_law_1.2,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,8,power_law_1.2,0.06857600212097167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,8,power_law_1.2,0.08001279830932617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,8,power_law_1.2,0.08210560083389282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,8,power_law_1.2,0.10065280199050904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,8,power_law_1.2,0.12408319711685181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,8,power_law_1.2,0.16475520133972169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,8,power_law_1.2,0.18360960483551025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,8,balanced,0.8993972937266032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,8,power_law_1.2,0.2711424112319946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,8,power_law_1.2,0.3988480091094971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,8,power_law_1.2,0.5501247882843018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,8,power_law_1.2,0.7314815998077393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,8,power_law_1.2,0.9078528404235839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,8,power_law_1.2,1.6198400497436523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,8,power_law_1.2,3.074278450012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,8,balanced,1.2667413552602131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,8,balanced,1.7830932935078938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,8,power_law_1.2,0.034995201230049136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,8,power_law_1.2,0.03191039860248566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,8,power_law_1.2,0.03357439935207367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,8,power_law_1.2,0.036006399989128114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,8,power_law_1.2,0.037363201379776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,8,power_law_1.2,0.04081920087337494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,8,power_law_1.2,0.041043201088905336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,8,power_law_1.2,0.042284798622131345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,8,power_law_1.2,0.04251520037651062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,8,power_law_1.2,0.04371840059757233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,8,power_law_1.2,0.046387198567390445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,8,power_law_1.2,0.04869759976863861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,8,power_law_1.2,0.050348800420761106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,8,power_law_1.2,0.05184000134468079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,8,power_law_1.2,0.057766401767730714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,8,power_law_1.2,0.05923839807510376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,8,power_law_1.2,0.06595199704170226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,4,balanced,0.03499733408292135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,8,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,8,power_law_1.2,0.09128959774971009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,4,balanced,0.03507733345031738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,4,balanced,0.036858665446440377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,8,power_law_1.2,0.11222399473190307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,4,balanced,0.0468746672074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,8,power_law_1.2,0.1313024044036865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,4,balanced,0.04534400006135305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,8,power_law_1.2,0.16809600591659546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,4,balanced,0.047541335225105286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,8,power_law_1.2,0.21799039840698242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,4,balanced,0.05584000051021576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,8,power_law_1.2,0.2851263999938965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,4,balanced,0.05724266668160757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,8,power_law_1.2,0.39492480754852294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,4,balanced,0.05748266478379568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,4,balanced,0.05956799785296122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,8,power_law_1.2,0.6201663970947265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,4,balanced,0.053210665782292686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,8,power_law_1.2,0.7444479942321778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,4,balanced,0.055813332398732506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,4,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,8,power_law_1.2,1.0678144454956056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,4,balanced,0.05729599793752035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,4,balanced,0.03312533348798752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,4,balanced,0.0595413347085317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,8,power_law_1.2,1.7587776184082031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,4,balanced,0.03492266684770584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,4,balanced,0.06469866633415222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,4,balanced,0.041946664452552795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,8,power_law_1.2,3.6974143981933594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,4,balanced,0.06666133304437001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,4,balanced,0.05006400247414907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,4,balanced,0.05077333251635233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,4,balanced,0.07355733215808868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,4,balanced,0.05050666630268097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,4,balanced,0.08290133376916249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,4,balanced,0.05017066498597463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,4,balanced,0.050800000627835594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,4,balanced,0.08964799841245015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,4,balanced,0.05142933130264282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,4,balanced,0.10682666301727295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,4,balanced,0.05195199946562449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,4,balanced,0.05377600093682607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,4,balanced,0.11682666341463725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,4,balanced,0.05464000006516775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,4,balanced,0.05630933245023092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,4,balanced,0.16476266582806906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,4,balanced,0.06126933296521505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,4,balanced,0.06227200229962667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,4,balanced,0.06713066498438518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,4,balanced,0.1649066706498464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,4,balanced,0.07705066601435344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,4,balanced,0.08622933427492778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,4,power_law_1.01,0.036524799466133115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,4,balanced,0.24086399873097739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,4,balanced,0.10169600447018941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,4,power_law_1.01,0.03559040129184723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,4,power_law_1.01,0.036032000184059144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,4,power_law_1.01,0.045407998561859134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,4,balanced,0.11828800042470296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,4,power_law_1.01,0.04892799854278564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,4,power_law_1.01,0.05074560046195984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,4,balanced,0.35417600472768146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,4,power_law_1.01,0.05602560043334961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,4,balanced,0.16404799620310465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,4,power_law_1.01,0.05294719934463501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,4,power_law_1.01,0.05687680244445801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,4,power_law_1.01,0.0603007972240448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,4,balanced,0.19850132862726846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,4,power_law_1.01,0.05676159858703613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,4,power_law_1.01,0.0355648010969162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,4,power_law_1.01,0.05863680243492127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,4,power_law_1.01,0.06096000075340271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,4,power_law_1.01,0.03415679931640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,4,power_law_1.01,0.06658560037612915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,4,balanced,0.529093345006307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,4,power_law_1.01,0.034918400645256045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,4,power_law_1.01,0.07223680019378662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,4,balanced,0.2853813370068868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,4,power_law_1.01,0.03776639997959137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,4,power_law_1.01,0.07438079714775085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,4,power_law_1.01,0.07917439937591553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,4,power_law_1.01,0.040057599544525146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,4,power_law_1.01,0.09207040071487427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,4,power_law_1.01,0.047244799137115476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,4,power_law_1.01,0.10435199737548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,4,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,4,power_law_1.01,0.12499200105667115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,4,balanced,0.38896532853444415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,4,power_law_1.01,0.1500159978866577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,4,power_law_1.01,0.0494592010974884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,4,power_law_1.01,0.18515199422836304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,4,power_law_1.01,0.050732797384262084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,4,power_law_1.01,0.2165503978729248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,4,balanced,0.6249759991963705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,4,power_law_1.01,0.052288001775741576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,4,power_law_1.01,0.3035648107528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,4,power_law_1.01,0.054073601961135864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,4,power_law_1.01,0.4284992218017578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,4,power_law_1.01,0.05854719877243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,4,power_law_1.01,0.5926271915435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,4,power_law_1.01,0.06000000238418579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,4,power_law_1.01,0.7934720039367675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,4,balanced,0.5750506718953451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,4,power_law_1.01,0.061612802743911746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,4,power_law_1.01,0.9117055892944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,4,power_law_1.01,0.06925439834594727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,4,power_law_1.01,1.5276415824890137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,4,power_law_1.01,0.07505919933319091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,4,power_law_1.01,0.07530879974365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,4,power_law_1.01,3.2837249755859377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,4,power_law_1.01,0.09990400075912476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,4,power_law_1.01,0.10245120525360107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,4,balanced,0.8058186372121176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,4,power_law_1.01,0.1279744029045105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,4,power_law_1.01,0.14572800397872926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,4,balanced,0.7228906949361166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,4,power_law_1.01,0.19892480373382568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,4,power_law_1.01,0.25667200088500974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,4,power_law_1.01,0.36487040519714353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,4,power_law_1.01,0.44515199661254884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,4,power_law_1.01,0.7055232048034668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,4,power_law_1.01,0.9252544403076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,4,power_law_1.01,1.0944831848144532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,4,power_law_1.01,1.8019584655761718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,4,balanced,0.922714630762736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,4,power_law_1.01,3.4735038757324217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,4,balanced,1.215727965037028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,4,power_law_1.2,0.036985599994659425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,4,power_law_1.2,0.035462400317192076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,4,power_law_1.2,0.036774399876594546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,4,power_law_1.2,0.03973760008811951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,4,balanced,1.3977866172790527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,4,power_law_1.2,0.05069440007209778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,4,power_law_1.2,0.05466880202293396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,4,power_law_1.2,0.057094401121139525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,4,power_law_1.2,0.055718398094177245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,4,power_law_1.2,0.05822719931602478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,4,power_law_1.2,0.06115840077400207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,4,power_law_1.2,0.05680000185966492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,4,power_law_1.2,0.0605567991733551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,4,power_law_1.2,0.060889601707458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,4,power_law_1.2,0.06593919992446899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,4,power_law_1.2,0.0756928026676178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,4,power_law_1.2,0.035206401348114015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,4,power_law_1.2,0.07544959783554077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,4,power_law_1.2,0.03296639919281006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,4,power_law_1.2,0.08133119940757752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,4,power_law_1.2,0.03498879969120026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,4,power_law_1.2,0.09899520277976989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,4,power_law_1.2,0.11165440082550049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,4,power_law_1.2,0.038726401329040525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,4,balanced,2.405205408732096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,4,power_law_1.2,0.1301695942878723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,4,power_law_1.2,0.04222719967365265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,4,power_law_1.2,0.15285760164260864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,4,power_law_1.2,0.04830079972743988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,4,power_law_1.2,0.1901247978210449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,4,power_law_1.2,0.04916479885578155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,4,power_law_1.2,0.04937599897384644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,4,power_law_1.2,0.2598144054412842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,4,power_law_1.2,0.05072640180587769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,4,power_law_1.2,0.36294400691986084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,4,power_law_1.2,0.05128960013389587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,4,power_law_1.2,0.4878079891204834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,4,power_law_1.2,0.05541759729385376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,4,power_law_1.2,0.7967679977416993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,4,power_law_1.2,0.05980799794197082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,4,power_law_1.2,0.921395206451416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,4,power_law_1.2,0.06209920048713684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,4,power_law_1.2,1.2492608070373534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,4,power_law_1.2,0.06213120222091675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,4,power_law_1.2,2.227481651306152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,4,power_law_1.2,0.07086079716682434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,4,balanced,2.8081334431966147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,4,power_law_1.2,0.07342079877853394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,4,power_law_1.2,4.352108764648437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,4,power_law_1.2,0.07987200021743775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,4,power_law_1.2,0.10177919864654542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,4,power_law_1.2,0.11173759698867798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,4,power_law_1.2,0.13160320520401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,4,power_law_1.2,0.15249279737472535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,4,power_law_1.2,0.2060159921646118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,4,power_law_1.2,0.2564480066299438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,4,power_law_1.2,0.43422718048095704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,4,power_law_1.2,0.5325056076049804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,4,power_law_1.2,0.7871935844421387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,4,power_law_1.2,1.0225472450256348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,4,power_law_1.2,1.3827839851379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,4,power_law_1.2,2.3624704360961912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,4,power_law_1.2,5.047590255737305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,32,balanced,0.05287999908129374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,32,balanced,0.05203199883302053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,32,balanced,0.05189866820971171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,32,balanced,0.05770133435726166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,32,balanced,0.0676800012588501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,32,balanced,0.07375999788443248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,32,balanced,0.0735093355178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,32,balanced,0.07481599847475688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,32,balanced,0.07479466497898102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,32,balanced,0.07579199969768524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,32,balanced,0.07668266693751018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,32,balanced,0.07706133524576823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,32,balanced,0.07768533130486806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,32,balanced,0.08007466793060303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,32,balanced,0.08377066254615784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,32,balanced,0.0849226713180542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,32,balanced,0.08629866441090901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,32,balanced,0.10005866487820943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,32,balanced,0.04795200129350027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,32,balanced,0.09588266412417094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,32,balanced,0.047194664676984154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,32,balanced,0.12365866700808208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,32,balanced,0.04715733230113983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,32,balanced,0.11515733599662781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,32,balanced,0.05132266879081726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,32,balanced,0.054746667544047035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,32,balanced,0.06226666768391927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,32,balanced,0.15842666228612265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,32,balanced,0.06347199777762096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,32,balanced,0.06437333424886067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,32,balanced,0.15914666652679443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,32,balanced,0.0642133355140686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,32,balanced,0.06542933483918507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,32,balanced,0.04117333392302195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,32,balanced,0.06650666892528534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,32,balanced,0.23788267374038696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,32,balanced,0.06681600213050842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,32,balanced,0.04165866722663244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,32,balanced,0.04171200096607208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,32,balanced,0.06857066849867503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,32,balanced,0.045514668027559914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,32,balanced,0.07030933101971944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,32,balanced,0.053226664662361145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,32,balanced,0.0745600014925003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,32,balanced,0.2568160096804301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,32,balanced,0.05810666580994924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,32,balanced,0.07812800010045369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,32,balanced,0.05917333563168844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,32,balanced,0.07999466856320699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,32,balanced,0.059546664357185364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,32,balanced,0.09735999504725139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,32,balanced,0.06005866825580597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,32,balanced,0.09603200356165568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,32,balanced,0.3906293312708537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,32,balanced,0.06047466893990835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,32,balanced,0.12428800264994304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,32,balanced,0.061706667145093284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,32,balanced,0.06163200239340464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,32,balanced,0.12693333625793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,32,balanced,0.06355733176072438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,32,balanced,0.0641599992911021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,32,balanced,0.16908800601959229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,32,balanced,0.06852266689141591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,32,balanced,0.45260266462961835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,32,balanced,0.1934666633605957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,32,balanced,0.07506666580835979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,32,power_law_1.01,0.07850880026817322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,32,balanced,0.2755626638730367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,32,balanced,0.07732800145943959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,32,power_law_1.01,0.07216640114784241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,32,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,32,power_law_1.01,0.06528000235557556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,32,power_law_1.01,0.06842880249023438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,32,balanced,0.32840534051259357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,32,balanced,0.5461599826812744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,32,power_law_1.01,0.06924160122871399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,32,balanced,0.08401067058245341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,32,power_law_1.01,0.07180799841880799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,32,power_law_1.01,0.07318400144577027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,32,balanced,0.09115200241406758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,32,power_law_1.01,0.07438719868659974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,32,power_law_1.01,0.07635200023651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,32,power_law_1.01,0.07936639785766601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,32,power_law_1.01,0.08478720188140869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,32,balanced,0.4838666518529256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,32,power_law_1.01,0.08659840226173401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,32,power_law_1.01,0.08702719807624817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,32,power_law_1.01,0.09598079919815064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,32,balanced,0.10709866881370544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,32,power_law_1.01,0.09731839895248413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,32,power_law_1.01,0.11340160369873047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,32,balanced,0.12040000160535176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,32,power_law_1.01,0.13345279693603515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,32,power_law_1.01,0.13138560056686402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,32,power_law_1.01,0.17586560249328614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,32,power_law_1.01,0.06261119842529297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,32,balanced,0.5950453281402588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,32,power_law_1.01,0.17655680179595948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,32,balanced,0.7837386926015218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,32,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,32,power_law_1.01,0.2665600061416626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,32,balanced,0.15516799688339233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,32,power_law_1.01,0.05545600056648255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,32,power_law_1.01,0.05225600004196167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,32,power_law_1.01,0.28739840984344484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,32,power_law_1.01,0.05411199927330017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,32,power_law_1.01,0.37448959350585936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,32,power_law_1.01,0.052691197395324706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,32,power_law_1.01,0.055961602926254274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,32,power_law_1.01,0.4055039882659912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,32,power_law_1.01,0.04442879855632782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,32,balanced,0.18081067005793253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,32,power_law_1.01,0.06110079884529114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,32,power_law_1.01,0.6470655918121337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,32,power_law_1.01,0.05075200200080872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,32,power_law_1.01,0.061478400230407716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,32,power_law_1.01,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,32,power_law_1.01,0.9005951881408691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,32,power_law_1.01,0.06212480068206787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,32,power_law_1.01,0.0633791983127594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,32,power_law_1.01,0.0571008026599884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,32,power_law_1.01,1.0766016006469727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,32,balanced,0.7291466395060221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,32,power_law_1.01,0.06515840291976929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,32,power_law_1.01,0.05982720255851746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,32,power_law_1.01,1.589574432373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,32,power_law_1.01,0.06702719926834107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,32,balanced,0.24758932987848917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,32,power_law_1.01,0.059628802537918094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,32,power_law_1.01,0.06992639899253845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,32,power_law_1.01,3.0148288726806642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,32,power_law_1.2,0.07259520292282104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,32,power_law_1.01,0.060915201902389526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,32,power_law_1.01,0.07196159958839417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,32,power_law_1.01,0.06249600052833557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,32,power_law_1.2,0.06207360029220581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,32,power_law_1.01,0.0782912015914917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,32,power_law_1.01,0.06565759778022766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,32,power_law_1.2,0.06498559713363647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,32,power_law_1.01,0.08711680173873901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,32,balanced,0.323525329430898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,32,power_law_1.2,0.06366080045700073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,32,power_law_1.01,0.06539520025253295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,32,power_law_1.01,0.09159039855003356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,32,power_law_1.01,0.07027199864387512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,32,power_law_1.01,0.09415680170059204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,32,power_law_1.2,0.06659839749336242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,32,power_law_1.2,0.06468480229377746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,32,power_law_1.01,0.11825920343399048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,32,power_law_1.2,0.07294080257415772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,32,power_law_1.01,0.0787775993347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,32,power_law_1.01,0.12437759637832642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,32,power_law_1.2,0.05112959742546082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,32,power_law_1.2,0.07122560143470764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,32,power_law_1.01,0.08982399702072144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,32,power_law_1.01,0.147161602973938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,32,power_law_1.2,0.052300798892974856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,32,power_law_1.2,0.07459200024604798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,32,balanced,0.46120532353719074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,32,power_law_1.01,0.16660480499267577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,32,power_law_1.01,0.08922880291938781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,32,power_law_1.2,0.05573760271072388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,32,power_law_1.2,0.07571200132369996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,32,power_law_1.01,0.2248768091201782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,32,balanced,1.1131253242492676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,32,power_law_1.2,0.07800319790840149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,32,power_law_1.2,0.05689600110054016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,32,power_law_1.01,0.09528959989547729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,32,power_law_1.01,0.27959680557250977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,32,power_law_1.2,0.06060799956321716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,32,power_law_1.2,0.08372480273246766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,32,power_law_1.2,0.06220160126686096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,32,power_law_1.01,0.36221439838409425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,32,power_law_1.2,0.08341119885444641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,32,balanced,1.5118239720662434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,32,power_law_1.01,0.1120576024055481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,32,power_law_1.2,0.06255999803543091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,32,power_law_1.01,0.4475711822509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,32,power_law_1.2,0.08604800105094909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,32,power_law_1.2,0.06714879870414733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,32,power_law_1.01,0.13260799646377563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,32,power_law_1.2,0.09007999897003174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,32,power_law_1.01,0.6673920154571533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,32,power_law_1.2,0.06741759777069092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,32,power_law_1.2,0.09445760250091553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,32,power_law_1.01,0.8969023704528809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,32,power_law_1.2,0.0700160026550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,32,power_law_1.2,0.09909759759902954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,32,power_law_1.01,1.0113920211791991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,32,power_law_1.01,0.16380159854888915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,32,balanced,0.603498657544454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,32,power_law_1.2,0.07249280214309692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,32,power_law_1.2,0.1184000015258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,32,power_law_1.01,0.19495680332183837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,32,power_law_1.01,1.6661376953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,32,power_law_1.2,0.07411199808120728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,32,power_law_1.2,0.15204479694366455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,32,power_law_1.2,0.07875840067863464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,32,power_law_1.2,0.15516799688339233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,32,power_law_1.01,3.4134654998779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,32,power_law_1.01,0.27582080364227296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,32,power_law_1.2,0.08799999952316284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,32,power_law_1.2,0.20156800746917725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,32,power_law_1.01,0.40427517890930176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,32,power_law_1.2,0.09585919976234436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,32,power_law_1.2,0.21203200817108153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,32,power_law_1.2,0.10012160539627075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,32,power_law_1.2,0.29008638858795166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,32,power_law_1.01,0.523526382446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,32,power_law_1.2,0.13396480083465576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,32,power_law_1.2,0.3564543962478638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,32,power_law_1.2,0.1302016019821167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,32,power_law_1.01,0.6785727977752686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,32,power_law_1.2,0.5297152042388916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,32,balanced,0.736746629079183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,32,power_law_1.2,0.16807039976119995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,32,power_law_1.01,1.012275218963623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,32,power_law_1.2,0.5605184078216553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,32,power_law_1.2,0.19381120204925537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,32,power_law_1.2,0.8485887527465821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,32,power_law_1.2,0.24252800941467284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,32,power_law_1.01,1.257408046722412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,32,power_law_1.2,1.3447360038757323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,32,power_law_1.2,0.3396352052688599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,32,power_law_1.01,1.8475008010864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,32,power_law_1.2,0.5201536178588867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,32,power_law_1.2,1.8864639282226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,32,power_law_1.01,2.9959999084472657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,32,power_law_1.2,0.5894656181335449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,32,power_law_1.2,2.535103988647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,32,power_law_1.2,0.8706111907958984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,32,power_law_1.01,5.829427337646484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,32,power_law_1.2,5.08458251953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,32,power_law_1.2,1.429094409942627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,32,balanced,2.174880027770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,32,power_law_1.2,1.5311103820800782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,32,power_law_1.2,2.9922624588012696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,32,balanced,1.1391626993815105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,32,power_law_1.2,5.645030212402344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,32,balanced,2.277887980143229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,32,power_law_1.2,0.05436800122261047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,32,power_law_1.2,0.04350079894065857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,32,power_law_1.2,0.04428800046443939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,32,power_law_1.2,0.05075200200080872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,32,power_law_1.2,0.05348479747772217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,32,power_law_1.2,0.05724160075187683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,32,power_law_1.2,0.05896959900856018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,32,power_law_1.2,0.06193280220031738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,32,power_law_1.2,0.060915201902389526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,32,power_law_1.2,0.06305279731750488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,32,power_law_1.2,0.0673471987247467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,16,balanced,0.05063466727733612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,32,power_law_1.2,0.06876159906387329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,16,balanced,0.051669334371884666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,32,power_law_1.2,0.07247999906539918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,16,balanced,0.05194666484991709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,32,power_law_1.2,0.08681600093841553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,16,balanced,0.060693333546320595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,32,power_law_1.2,0.0871999979019165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,16,balanced,0.07155733307202657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,16,balanced,0.07743466893831889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,32,power_law_1.2,0.09256960153579712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,16,balanced,0.07855999966462453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,16,balanced,0.07975466549396515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,32,power_law_1.2,0.10151040554046631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,16,balanced,0.07905066510041554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,16,balanced,0.04567466676235199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,16,balanced,0.08012799918651581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,16,balanced,0.04716266691684723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,16,balanced,0.08171199758847554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,16,balanced,0.046480000019073486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,32,power_law_1.2,0.1197119951248169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,16,balanced,0.08298133313655853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,16,balanced,0.05221333106358846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,32,power_law_1.2,0.14151040315628052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,16,balanced,0.0823359986146291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,16,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,16,balanced,0.08428266644477844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,16,balanced,0.06529066463311513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,16,balanced,0.06632533172766368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,16,balanced,0.08658666412035625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,32,power_law_1.2,0.1643839955329895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,16,balanced,0.06695466736952464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,16,balanced,0.0929813285668691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,32,power_law_1.2,0.24191999435424805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,16,balanced,0.06673599779605865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,16,balanced,0.08899199962615967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,16,balanced,0.06791466474533081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,32,power_law_1.2,0.32150399684906006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,16,balanced,0.11116266250610352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,16,balanced,0.06835733354091644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,32,power_law_1.2,0.4839871883392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,16,balanced,0.06903466582298279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,16,balanced,0.10325866937637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,16,balanced,0.07075199981530507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,32,power_law_1.2,0.7220863819122314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,16,balanced,0.13570132851600647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,16,balanced,0.07374933362007141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,16,balanced,0.07585066556930542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,32,power_law_1.2,1.1155263900756835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,16,balanced,0.12650133172671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,16,balanced,0.07892266909281413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,32,power_law_1.2,1.3110655784606933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,16,balanced,0.08136000235875447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,16,power_law_1.01,0.07379840016365051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,16,balanced,0.17096000909805298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,32,power_law_1.2,1.7456192016601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,16,balanced,0.1049066682656606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,16,power_law_1.01,0.07553279995918274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,16,balanced,0.10169600447018941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,16,power_law_1.01,0.06033920049667359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,32,power_law_1.2,3.340300750732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,16,balanced,0.17941333850224814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,16,power_law_1.01,0.061401599645614625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,16,balanced,0.1344106694062551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,32,power_law_1.2,4.5159553527832035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,16,power_law_1.01,0.06552960276603699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,16,power_law_1.01,0.06314240097999572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,16,balanced,0.1341546674569448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,16,power_law_1.01,0.07412480115890503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,16,balanced,0.04140799989302953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,16,balanced,0.26362667481104535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,16,power_law_1.01,0.06001920104026794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,32,power_law_1.2,9.906886291503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,16,power_law_1.01,0.0754751980304718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,16,power_law_1.01,0.049568000435829165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,16,balanced,0.042133331298828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,16,power_law_1.01,0.07499520182609558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,16,power_law_1.01,0.05533440113067627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,16,balanced,0.04262933135032654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,16,balanced,0.18141865730285645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,16,power_law_1.01,0.05553920269012451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,16,power_law_1.01,0.07832319736480713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,16,power_law_1.01,0.056492799520492555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,16,balanced,0.047872001926104225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,16,balanced,0.055861334005991616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,16,power_law_1.01,0.07736319899559022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,16,power_law_1.01,0.060070401430130003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,16,power_law_1.01,0.05720959901809693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,16,balanced,0.2963520089785258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,16,balanced,0.0605973352988561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,16,balanced,0.20801067352294922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,16,power_law_1.01,0.061689597368240354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,16,power_law_1.01,0.08117120265960694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,16,power_law_1.01,0.046758401393890384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,16,balanced,0.062181333700815834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,16,power_law_1.01,0.06185600161552429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,16,power_law_1.01,0.08362879753112792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,16,balanced,0.06275733311971028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,16,power_law_1.01,0.05249919891357422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,16,balanced,0.06317866841952006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,16,power_law_1.01,0.06323199868202209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,16,power_law_1.01,0.0856383979320526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,16,power_law_1.01,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,16,balanced,0.06390933195749919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,16,power_law_1.01,0.06684160232543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,16,balanced,0.29873599608739215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,16,power_law_1.01,0.09037439823150635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,16,balanced,0.06529066463311513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,16,power_law_1.01,0.05873280167579651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,16,balanced,0.0653706689675649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,16,power_law_1.01,0.0691968023777008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,16,power_law_1.01,0.11626240015029907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,16,balanced,0.4452373186747233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,16,power_law_1.01,0.059961599111557004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,16,balanced,0.06807999809583028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,16,power_law_1.01,0.07235199809074402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,16,power_law_1.01,0.11633919477462769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,16,power_law_1.01,0.06335359811782837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,16,balanced,0.06982400019963582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,16,power_law_1.01,0.07240319848060608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,16,power_law_1.01,0.10898560285568237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,16,balanced,0.07377600173155467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,16,power_law_1.01,0.06403200030326843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,16,balanced,0.36054933071136475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,16,power_law_1.01,0.07519999742507935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,16,power_law_1.01,0.13013119697570802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,16,power_law_1.01,0.06700800061225891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,16,power_law_1.01,0.0818943977355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,16,power_law_1.01,0.06970880031585694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,16,power_law_1.01,0.1351040005683899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,16,balanced,0.08107199768225352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,16,power_law_1.01,0.08724480271339416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,16,power_law_1.01,0.07223039865493774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,16,power_law_1.01,0.16643840074539185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,16,power_law_1.01,0.0990015983581543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,16,power_law_1.01,0.07729920148849487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,16,power_law_1.01,0.18241280317306519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,16,power_law_1.01,0.11838719844818116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,16,balanced,0.08613866567611694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,16,balanced,0.5292266607284546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,16,power_law_1.01,0.08193920254707336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,16,power_law_1.01,0.23332479000091552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,16,power_law_1.01,0.12487679719924927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,16,power_law_1.01,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,16,power_law_1.01,0.2755712032318115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,16,balanced,0.5266293287277222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,16,power_law_1.01,0.15296640396118164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,16,power_law_1.01,0.1712448000907898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,16,power_law_1.01,0.3858304023742676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,16,power_law_1.01,0.09419519901275634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,16,power_law_1.01,0.22133760452270507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,16,power_law_1.01,0.45486721992492674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,16,power_law_1.01,0.2783616065979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,16,balanced,0.09603733817736308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,16,power_law_1.01,0.6922688007354736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,16,power_law_1.01,0.3758080005645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,16,power_law_1.01,0.10919040441513062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,16,balanced,0.10496000448862712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,16,power_law_1.01,0.8349568367004394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,16,power_law_1.01,0.5015744209289551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,16,power_law_1.01,0.7020800113677979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,16,power_law_1.01,1.048703956604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,16,power_law_1.01,0.11966079473495483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,16,power_law_1.01,0.9086336135864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,16,balanced,0.626858671506246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,16,power_law_1.01,1.5439743995666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,16,balanced,0.6522773504257202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,16,power_law_1.01,0.13904639482498168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,16,power_law_1.01,1.1165568351745605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,16,power_law_1.2,0.07359359860420227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,16,power_law_1.01,1.7994880676269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,16,power_law_1.01,3.4543041229248046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,16,balanced,0.12642133235931396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,16,power_law_1.2,0.055718398094177245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,16,power_law_1.01,0.1680896043777466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,16,power_law_1.01,3.5490177154541014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,16,balanced,0.14383467038472494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,16,power_law_1.2,0.06050559878349304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,16,power_law_1.01,0.22911999225616456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,16,power_law_1.2,0.0636031985282898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,16,power_law_1.2,0.06376960277557372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,16,power_law_1.01,0.28666880130767824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,16,power_law_1.2,0.07464960217475891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,16,balanced,0.19167466958363852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,16,power_law_1.01,0.4148672103881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,16,power_law_1.2,0.07326719760894776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,16,balanced,0.7902560234069824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,16,power_law_1.2,0.07774080038070678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,16,balanced,0.2383306622505188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,16,power_law_1.2,0.07772160172462464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,16,power_law_1.01,0.6164608001708984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,16,power_law_1.2,0.07915520071983337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,16,balanced,0.9391146500905355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,16,power_law_1.01,0.8034175872802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,16,power_law_1.2,0.08330240249633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,16,power_law_1.2,0.0887167990207672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,16,power_law_1.01,1.1127424240112305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,16,balanced,0.3505280017852783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,16,power_law_1.2,0.09095039963722229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,16,power_law_1.01,1.339846420288086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,16,power_law_1.2,0.1034816026687622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,16,power_law_1.01,1.8716032028198242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,16,power_law_1.2,0.11641600131988525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,16,power_law_1.2,0.12220159769058228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,16,balanced,0.45340800285339355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,16,power_law_1.01,2.9791040420532227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,16,power_law_1.2,0.11166720390319824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,16,power_law_1.2,0.12999680042266845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,16,power_law_1.01,5.472639846801758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,16,power_law_1.2,0.13808640241622924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,16,balanced,1.2220160166422527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,16,power_law_1.2,0.18520959615707397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,16,power_law_1.2,0.18925440311431885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,16,balanced,0.6329226493835449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,16,power_law_1.2,0.2766144037246704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,16,power_law_1.2,0.33747200965881347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,16,power_law_1.2,0.4797247886657715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,16,power_law_1.2,0.6003200054168701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,16,power_law_1.2,0.8431743621826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,16,balanced,0.8331147034962972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,16,power_law_1.2,1.267039966583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,16,power_law_1.2,1.517471981048584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,16,power_law_1.2,2.097452735900879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,16,power_law_1.2,5.509843063354492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,16,balanced,1.7948533693949382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,16,balanced,1.0187466939290364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,16,balanced,2.3936373392740884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,16,balanced,1.5842186609903972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,16,power_law_1.2,0.06121600270271301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,16,power_law_1.2,0.05117440223693848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,16,power_law_1.2,0.05125759840011597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,16,power_law_1.2,0.054553598165512085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,16,power_law_1.2,0.05608320236206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,16,power_law_1.2,0.06188160181045532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,16,power_law_1.2,0.06317440271377564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,16,power_law_1.2,0.06580479741096497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,16,power_law_1.2,0.06647040247917176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,16,power_law_1.2,0.06721919775009155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,16,power_law_1.2,0.06997759938240052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,16,power_law_1.2,0.0733568012714386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,16,power_law_1.2,0.07900159955024719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,16,power_law_1.2,0.07575039863586426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,16,power_law_1.2,0.08339200019836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,16,power_law_1.2,0.09028480052947999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,16,power_law_1.2,0.10039680004119873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,16,power_law_1.2,0.11848959922790528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,16,power_law_1.2,0.13017599582672118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,16,power_law_1.2,0.1664576053619385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,16,power_law_1.2,0.19048960208892823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,16,balanced,3.1507040659586587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,16,power_law_1.2,0.2410111904144287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,16,power_law_1.2,0.3096895933151245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,16,power_law_1.2,0.056550401449203494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,16,power_law_1.2,0.44268159866333007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,16,power_law_1.2,0.047891199588775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,16,power_law_1.2,0.5568064212799072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,16,power_law_1.2,0.04535039961338043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,8,balanced,0.051701332132021584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,16,power_law_1.2,0.9015040397644043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,16,power_law_1.2,0.05182719826698303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,8,balanced,0.052005335688591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,16,power_law_1.2,1.0787199974060058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,16,power_law_1.2,0.053529602289199826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,8,balanced,0.05438933273156484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,16,power_law_1.2,0.06102399826049805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,8,balanced,0.062047998110453285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,16,power_law_1.2,1.3847807884216308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,8,balanced,0.0728959987560908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,16,power_law_1.2,0.05987200140953064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,16,power_law_1.2,2.5440319061279295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,8,balanced,0.07890133559703827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,16,power_law_1.2,0.06361600160598754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,8,balanced,0.07889066636562347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,16,power_law_1.2,0.06424959897994995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,16,power_law_1.2,5.302336120605469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,8,balanced,0.08097066481908162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,16,power_law_1.2,0.06735360026359558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,8,balanced,0.08155199885368347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,16,power_law_1.2,0.07149440050125122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,8,balanced,0.0813920001188914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,16,power_law_1.2,0.07342079877853394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,8,balanced,0.08303999900817871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,8,balanced,0.0845973292986552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,16,power_law_1.2,0.07633280158042907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,8,balanced,0.08530666430791219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,16,power_law_1.2,0.08060799837112427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,8,balanced,0.0884320040543874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,16,power_law_1.2,0.0953984022140503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,8,balanced,0.09267200032869975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,8,balanced,0.04604800045490265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,16,power_law_1.2,0.09898239970207215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,8,balanced,0.09345066547393799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,8,balanced,0.046997333566347756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,8,balanced,0.09675733248392741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,8,balanced,0.05163733164469401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,16,power_law_1.2,0.10883200168609619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,8,balanced,0.05417599777380625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,8,balanced,0.14526399970054626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,8,balanced,0.06435733536879222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,8,balanced,0.11586667100588481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,16,power_law_1.2,0.13296639919281006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,8,balanced,0.06986133257548015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,8,balanced,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,16,power_law_1.2,0.14739840030670165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,8,balanced,0.14566399653752646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,8,balanced,0.07134933272997539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,8,balanced,0.07217599948247273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,8,balanced,0.14727999766667685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,8,balanced,0.0728959987560908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,16,power_law_1.2,0.18634239435195923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,8,balanced,0.07459199925263722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,8,balanced,0.07445866862932841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,8,balanced,0.22801599899927774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,16,power_law_1.2,0.25884160995483396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,8,balanced,0.0763626645008723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,8,balanced,0.07936533292134602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,16,power_law_1.2,0.37711999416351316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,8,balanced,0.0855466624101003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,8,balanced,0.22233599424362183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,16,power_law_1.2,0.468064022064209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,8,balanced,0.08846933643023173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,8,power_law_1.01,0.062431997060775755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,8,balanced,0.09089600046475728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,16,power_law_1.2,0.7467072010040283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,8,power_law_1.01,0.06485120058059693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,8,balanced,0.34568532307942706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,8,balanced,0.118559996287028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,8,power_law_1.01,0.05505920052528381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,16,power_law_1.2,0.896889591217041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,8,balanced,0.1139359970887502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,8,power_law_1.01,0.06431999802589417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,16,power_law_1.2,1.4522624015808105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,8,power_law_1.01,0.06944000124931335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,8,balanced,0.14149866501490274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,16,power_law_1.2,2.1251392364501953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,8,power_law_1.01,0.07834879755973816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,8,balanced,0.37652798493703205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,8,power_law_1.01,0.07936639785766601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,16,power_law_1.2,2.625984001159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,8,balanced,0.15366933743158975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,8,balanced,0.04312000175317129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,8,power_law_1.01,0.08111360073089599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,8,balanced,0.04554666578769684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,16,power_law_1.2,4.287238311767578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,8,power_law_1.01,0.0815999984741211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,8,balanced,0.21766400337219238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,8,balanced,0.04703466594219208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,8,power_law_1.01,0.08505600094795226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,8,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,16,power_law_1.2,9.09793930053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,8,power_law_1.01,0.08727040290832519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,8,balanced,0.5770933230717977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,8,balanced,0.06333333253860474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,8,balanced,0.2521066665649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,8,power_law_1.01,0.09181439876556396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,8,balanced,0.06922133266925812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,8,balanced,0.07077866792678833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,8,power_law_1.01,0.09503359794616699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,8,power_law_1.01,0.05260800123214722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,8,balanced,0.07116800049940745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,8,power_law_1.01,0.09613440036773682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,8,balanced,0.3575413227081299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,8,power_law_1.01,0.05397120118141174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,8,balanced,0.07239466905593872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,8,power_law_1.01,0.1067199945449829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,8,power_law_1.01,0.053311997652053834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,8,balanced,0.07361599802970886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,8,power_law_1.01,0.11408640146255493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,8,power_law_1.01,0.05518720149993896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,8,balanced,0.07484800120194753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,8,power_law_1.01,0.12885760068893432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,8,balanced,0.6944746971130371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,8,power_law_1.01,0.05994880199432373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,8,balanced,0.44649068514506024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,8,balanced,0.07656000057856242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,8,power_law_1.01,0.1542080044746399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,8,power_law_1.01,0.06650879979133606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,8,balanced,0.07916800181070964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,8,power_law_1.01,0.15162880420684816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,8,power_law_1.01,0.06851840019226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,8,balanced,0.08214933176835378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,8,power_law_1.01,0.18201600313186644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,8,power_law_1.01,0.06835200190544129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,8,power_law_1.01,0.21106560230255128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,8,balanced,0.0872213343779246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,8,power_law_1.01,0.07030400037765502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,8,power_law_1.01,0.27182080745697024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,8,power_law_1.01,0.07238399982452393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,8,balanced,0.657093326250712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,8,power_law_1.01,0.30471680164337156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,8,balanced,0.09607999523480733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,8,power_law_1.01,0.0748799979686737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,8,power_law_1.01,0.4356800079345703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,8,power_law_1.01,0.07928320169448852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,8,balanced,0.7969066301981608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,8,power_law_1.01,0.5468671798706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,8,balanced,0.10382933417956035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,8,power_law_1.01,0.08379520177841186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,8,power_law_1.01,0.7440512180328369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,8,power_law_1.01,0.08456959724426269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,8,power_law_1.01,0.09284480214118958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,8,power_law_1.01,0.9441280364990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,8,power_law_1.01,0.09868800044059753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,8,balanced,0.8175360361735026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,8,power_law_1.01,1.3085760116577148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,8,balanced,0.11923199892044067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,8,power_law_1.01,0.10967040061950684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,8,power_law_1.01,1.7479936599731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,8,power_law_1.01,0.1317055940628052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,8,balanced,0.1323466698328654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,8,power_law_1.01,0.13679360151290892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,8,power_law_1.01,3.952006530761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,8,power_law_1.01,0.17147519588470458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,8,power_law_1.01,0.20483839511871338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,8,power_law_1.01,0.25032958984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,8,balanced,0.1649493376413981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,8,power_law_1.01,0.3116544008255005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,8,balanced,0.9794080257415771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,8,balanced,1.2893706957499187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,8,balanced,0.20321067174275717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,8,power_law_1.01,0.4470719814300537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,8,power_law_1.01,0.5501503944396973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,8,balanced,0.30645867188771564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,8,power_law_1.01,0.8580160140991211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,8,power_law_1.01,1.0547327995300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,8,power_law_1.01,0.05348479747772217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,8,balanced,0.37570667266845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,8,power_law_1.01,0.05729920268058777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,8,power_law_1.01,1.3581503868103026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,8,power_law_1.01,0.04904319941997528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,8,power_law_1.01,2.2542848587036133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,8,power_law_1.01,0.05496320128440857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,8,power_law_1.01,0.05809919834136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,8,power_law_1.01,0.0664255976676941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,8,power_law_1.01,4.112275314331055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,8,power_law_1.01,0.07006719708442688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,8,power_law_1.01,0.07071999907493591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,8,balanced,0.5276906490325928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,8,power_law_1.01,0.0732096016407013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,8,power_law_1.01,0.07684479951858521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,8,power_law_1.01,0.0797760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,8,power_law_1.01,0.08387839794158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,8,balanced,1.555514653523763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,8,power_law_1.01,0.08943359851837158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,8,power_law_1.01,0.09384959936141968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,8,balanced,0.6822559833526611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,8,power_law_1.01,0.10705920457839965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,8,power_law_1.01,0.11510399580001832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,8,power_law_1.2,0.06247040033340454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,8,power_law_1.01,0.12810239791870118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,8,power_law_1.2,0.0580672025680542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,8,power_law_1.2,0.05583360195159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,8,power_law_1.2,0.06270719766616821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,8,balanced,0.982373317082723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,8,power_law_1.01,0.1444416046142578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,8,power_law_1.2,0.06757760047912598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,8,power_law_1.01,0.16725759506225585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,8,power_law_1.2,0.0775168001651764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,8,power_law_1.2,0.08061439990997314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,8,power_law_1.2,0.0803712010383606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,8,power_law_1.01,0.23104639053344728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,8,power_law_1.2,0.08419839739799499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,8,power_law_1.01,0.29900801181793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,8,power_law_1.2,0.0844543993473053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,8,balanced,2.4369707107543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,8,power_law_1.01,0.42075519561767577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,8,power_law_1.2,0.09085440039634704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,8,power_law_1.01,0.5528192043304443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,8,power_law_1.2,0.09439359903335572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,8,balanced,1.29148268699646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,8,power_law_1.2,0.10565760135650634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,8,power_law_1.01,0.7572927951812745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,8,power_law_1.2,0.09968000054359435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,8,power_law_1.01,1.1363903999328613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,8,power_law_1.01,1.5311039924621581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,8,power_law_1.2,0.11115520000457764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,8,power_law_1.01,1.922105598449707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,8,power_law_1.2,0.11176960468292237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,8,power_law_1.01,2.5023935317993162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,8,power_law_1.2,0.14053759574890137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,8,power_law_1.01,3.654790496826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,8,power_law_1.2,0.1624127984046936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,8,power_law_1.2,0.15660799741744996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,8,power_law_1.01,7.7104637145996096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,8,power_law_1.2,0.20468480587005616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,8,balanced,1.574933369954427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,8,power_law_1.2,0.2161792039871216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,8,balanced,3.035285313924154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,8,power_law_1.2,0.28784639835357667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,8,power_law_1.2,0.35292160511016846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,8,power_law_1.2,0.4882239818572998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,8,power_law_1.2,0.588102388381958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,8,power_law_1.2,0.8065535545349121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,8,power_law_1.2,1.1241408348083497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,8,power_law_1.2,0.053491199016571046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,8,power_law_1.2,1.3950400352478027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,8,power_law_1.2,0.04843519926071167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,8,power_law_1.2,2.487980842590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,8,power_law_1.2,0.051648002862930295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,8,power_law_1.2,5.003225708007813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,8,power_law_1.2,0.055219197273254396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,8,balanced,2.4780373573303223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,8,power_law_1.2,0.05932160019874573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,8,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,8,power_law_1.2,0.06763520240783691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,8,power_law_1.2,0.06997759938240052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,8,power_law_1.2,0.07152000069618225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,8,power_law_1.2,0.07310079932212829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,8,power_law_1.2,0.07692800164222717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,8,power_law_1.2,0.07897599935531616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,8,power_law_1.2,0.08774399757385254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,8,power_law_1.2,0.08714240193367004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,8,power_law_1.2,0.09368320107460022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,8,power_law_1.2,0.10443520545959473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,8,power_law_1.2,0.11282559633255004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,8,power_law_1.2,0.13484159708023072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,8,power_law_1.2,0.1405184030532837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,8,power_law_1.2,0.17851519584655762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,8,power_law_1.2,0.21699841022491456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,8,power_law_1.2,0.29418239593505857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,8,power_law_1.2,0.05334399938583374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,8,power_law_1.2,0.3462975978851318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,8,power_law_1.2,0.04699519872665405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,8,power_law_1.2,0.47618560791015624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,8,power_law_1.2,0.04847359955310822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,8,power_law_1.2,0.05569919943809509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,8,power_law_1.2,0.5937088012695313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,8,balanced,4.933269182840983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,8,power_law_1.2,0.059564799070358276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,8,power_law_1.2,0.9034943580627441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,8,power_law_1.2,0.06696320176124573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,8,power_law_1.2,1.147929573059082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,8,power_law_1.2,0.07059199810028076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,8,power_law_1.2,1.593990421295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,8,power_law_1.2,0.07047039866447449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,8,power_law_1.2,0.07330560088157653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,8,power_law_1.2,2.5607872009277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,8,power_law_1.2,0.07827200293540955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,8,power_law_1.2,0.07998080253601074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,8,power_law_1.2,5.813407897949219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,4,balanced,0.05162666738033295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,8,power_law_1.2,0.0845632016658783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,4,balanced,0.053914666175842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,8,power_law_1.2,0.09076480269432068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,4,balanced,0.05608533322811127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,4,balanced,0.0690773328145345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,8,power_law_1.2,0.09858559966087341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,4,balanced,0.0846720039844513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,8,power_law_1.2,0.11073280572891235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,4,balanced,0.09134399890899658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,4,balanced,0.09185600280761719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,8,power_law_1.2,0.11593600511550903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,4,balanced,0.0918293297290802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,4,balanced,0.09159466624259949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,8,power_law_1.2,0.1358847975730896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,4,balanced,0.09249066313107808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,4,balanced,0.09409067034721375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,4,balanced,0.09618666768074036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,8,power_law_1.2,0.1518272042274475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,4,balanced,0.09506666660308838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,8,power_law_1.2,0.17932800054550171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,4,balanced,0.0992746651172638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,4,balanced,0.10589866836865743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,4,balanced,0.12804800271987915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,8,power_law_1.2,0.23720960617065429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,4,balanced,0.11195733149846394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,8,power_law_1.2,0.32359039783477783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,4,balanced,0.1625920037428538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,8,power_law_1.2,0.4684864044189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,4,balanced,0.145797332127889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,8,power_law_1.2,0.5648064136505127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,4,balanced,0.19137599070866904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,8,power_law_1.2,0.9157376289367676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,4,balanced,0.046570668617884316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,8,power_law_1.2,1.235257625579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,4,balanced,0.18861865997314453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,4,balanced,0.04888000090916952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,8,power_law_1.2,1.8664960861206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,4,balanced,0.05046933392683665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,4,balanced,0.058117335041364036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,4,balanced,0.28758933146794635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,8,power_law_1.2,2.24768009185791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,4,balanced,0.07055466870466869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,8,power_law_1.2,2.4758975982666014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,4,balanced,0.07782933115959167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,4,balanced,0.3222986658414205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,4,balanced,0.08038933575153351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,8,power_law_1.2,5.297580718994141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,4,power_law_1.01,0.054816001653671266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,4,balanced,0.08032533526420593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,4,power_law_1.01,0.06551679968833923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,4,balanced,0.08161066472530365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,8,power_law_1.2,8.916896057128906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,4,power_law_1.01,0.05605760216712952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,4,balanced,0.08201600114504497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,4,balanced,0.4912373224894206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,4,power_law_1.01,0.06314240097999572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,4,balanced,0.08403733372688293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,4,power_law_1.01,0.06962559819221496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,4,balanced,0.08515733480453491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,4,power_law_1.01,0.08432000279426574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,4,balanced,0.08704533179601033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,4,power_law_1.01,0.0876800000667572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,4,balanced,0.5821919838587443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,4,balanced,0.09074133634567261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,4,power_law_1.01,0.09019520282745361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,4,balanced,0.09848533074061076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,4,power_law_1.01,0.09111040234565734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,4,balanced,0.1020906666914622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,4,power_law_1.01,0.09306880235671997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,4,balanced,0.10805867115656535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,4,power_law_1.01,0.09352319836616516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,4,power_law_1.01,0.09598720073699951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,4,balanced,0.1553439994653066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,4,balanced,0.8659413655598959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,4,power_law_1.01,0.1023103952407837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,4,balanced,0.14044800400733948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,4,power_law_1.01,0.04883840084075928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,4,power_law_1.01,0.11235840320587158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,4,power_law_1.01,0.1282688021659851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,4,power_law_1.01,0.054048001766204834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,4,balanced,0.1830186645189921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,4,power_law_1.01,0.05027840137481689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,4,power_law_1.01,0.13882880210876464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,4,power_law_1.01,0.05902079939842224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,4,power_law_1.01,0.13549439907073973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,4,balanced,0.194815993309021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,4,power_law_1.01,0.062431997060775755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,4,power_law_1.01,0.17004799842834473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,4,power_law_1.01,0.07319039702415467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,4,power_law_1.01,0.17271679639816284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,4,power_law_1.01,0.07544959783554077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,4,balanced,0.2863146662712097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,4,power_law_1.01,0.07782400250434876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,4,power_law_1.01,0.20606720447540283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,4,balanced,1.041647990544637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,4,power_law_1.01,0.08037760257720947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,4,power_law_1.01,0.2513279914855957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,4,power_law_1.01,0.08008319735527039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,4,power_law_1.01,0.08733440041542054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,4,power_law_1.01,0.3042112112045288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,4,balanced,0.34124799569447833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,4,power_law_1.01,0.0907904028892517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,4,power_law_1.01,0.38226559162139895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,4,power_law_1.01,0.09300479888916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,4,power_law_1.01,0.5680704116821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,4,power_law_1.01,0.09630720019340515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,4,power_law_1.01,0.10575360059738159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,4,power_law_1.01,0.7190080165863038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,4,balanced,0.49321067333221436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,4,power_law_1.01,0.11447679996490479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,4,power_law_1.01,0.9586560249328613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,4,power_law_1.01,0.12788480520248413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,4,power_law_1.01,1.3218175888061523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,4,power_law_1.01,0.15912959575653077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,4,power_law_1.01,0.1639232039451599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,4,power_law_1.01,1.6251264572143556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,4,balanced,1.2254400253295898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,4,power_law_1.01,0.2012864112854004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,4,power_law_1.01,2.310291290283203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,4,balanced,0.6435199975967407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,4,power_law_1.01,0.2507008075714111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,4,power_law_1.01,0.3118272066116333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,4,power_law_1.01,4.825222396850586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,4,power_law_1.01,0.39768319129943847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,4,power_law_1.01,0.5574016094207763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,4,power_law_1.01,0.6828351974487304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,4,power_law_1.01,1.0069055557250977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,4,balanced,0.9382080237070719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,4,power_law_1.01,1.2811903953552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,4,power_law_1.01,1.8068223953247071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,4,power_law_1.01,2.626323127746582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,4,power_law_1.01,5.627264022827148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,4,balanced,1.9478027025858562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,4,balanced,1.154842694600423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,4,power_law_1.2,0.05490559935569763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,4,balanced,1.4119359652201335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,4,power_law_1.2,0.05552639961242676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,4,power_law_1.2,0.05548160076141358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,4,power_law_1.2,0.06626560091972351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,4,power_law_1.2,0.0699072003364563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,4,power_law_1.2,0.08280959725379944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,4,power_law_1.2,0.08775039911270141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,4,power_law_1.2,0.09052159786224365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,4,power_law_1.2,0.09056640267372132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,4,power_law_1.2,0.09351680278778077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,4,power_law_1.2,0.09464319944381713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,4,power_law_1.2,0.10004479885101318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,4,power_law_1.2,0.106387197971344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,4,power_law_1.2,0.12647039890289308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,4,power_law_1.2,0.133024001121521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,4,balanced,2.1921706199645996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,4,power_law_1.2,0.14416639804840087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,4,power_law_1.2,0.14690560102462769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,4,power_law_1.2,0.17878400087356566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,4,power_law_1.2,0.18372479677200318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,4,balanced,3.7474454243977866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,4,power_law_1.2,0.22320001125335692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,4,power_law_1.2,0.2581183910369873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,4,power_law_1.2,0.34221439361572265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,4,power_law_1.2,0.43505277633666994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,4,power_law_1.2,0.6406527996063233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,4,power_law_1.2,0.7283199787139892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,4,power_law_1.2,1.0451775550842286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,4,power_law_1.2,1.3980735778808593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,4,power_law_1.2,1.7856639862060546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,4,power_law_1.2,0.048902401328086854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,4,power_law_1.2,2.601235198974609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,4,power_law_1.2,0.04992640018463135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,4,power_law_1.2,0.05117440223693848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,4,power_law_1.2,6.628479766845703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,4,power_law_1.2,0.055731201171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,4,power_law_1.2,0.06135680079460144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,4,power_law_1.2,0.07363200187683105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,4,power_law_1.2,0.07512320280075073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,4,power_law_1.2,0.07845119833946228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,4,power_law_1.2,0.08056319952011108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,4,power_law_1.2,0.08341119885444641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,4,power_law_1.2,0.08803840279579163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,4,balanced,4.324501355489095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,4,power_law_1.2,0.09254400134086609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,4,power_law_1.2,0.096697598695755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,4,power_law_1.2,0.09831680059432983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,4,power_law_1.2,0.11104639768600463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,4,power_law_1.2,0.11683839559555054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,4,power_law_1.2,0.13344000577926635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,4,power_law_1.2,0.16972800493240356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,4,power_law_1.2,0.16127359867095947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,4,power_law_1.2,0.21342079639434813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,4,power_law_1.2,0.2542783975601196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,4,power_law_1.2,0.3199295997619629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,4,power_law_1.2,0.41125760078430174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,4,power_law_1.2,0.6112127780914307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,4,power_law_1.2,0.7994304180145264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,4,power_law_1.2,1.2316991806030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,4,power_law_1.2,1.5940608024597167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,128,balanced,0.19022933642069498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,4,power_law_1.2,1.9090112686157226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,128,balanced,0.18844799200693765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,4,power_law_1.2,2.9832128524780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,128,balanced,0.1925333340962728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,128,balanced,0.2015519936879476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,4,power_law_1.2,6.8532157897949215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,128,balanced,0.20360000928243002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,128,balanced,0.3508533239364624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,128,balanced,0.11678399642308553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,128,balanced,0.5165280103683472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,128,balanced,0.11608533064524333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,128,balanced,0.5178720156351725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,128,balanced,0.12098133563995361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,128,balanced,0.5001493295033773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,128,balanced,0.12050132950146993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,128,balanced,0.5028479894002279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,128,balanced,0.12035199999809265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,128,balanced,0.5027893384297689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,128,balanced,0.20698134104410806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,128,balanced,0.2746559977531433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,128,balanced,0.5092213153839111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,128,balanced,0.3002240061759949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,128,balanced,0.5196959972381592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,128,balanced,0.3078666726748149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,128,balanced,0.5205920139948527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,128,balanced,0.283680001894633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,128,balanced,0.5114133358001709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,128,balanced,0.31989334026972455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,128,balanced,0.5179306666056315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,128,balanced,0.28385066986083984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,128,balanced,0.49956798553466797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,128,balanced,0.29397332668304443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,128,balanced,0.5292319854100546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,128,balanced,0.29414933919906616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,128,balanced,0.3014986713727315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,128,balanced,0.502458651860555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,128,balanced,0.30029332637786865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,128,balanced,0.49737600485483807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,128,balanced,0.31433600187301636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,128,balanced,0.49616531531016034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,128,balanced,0.3169493277867635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,128,balanced,0.3248053391774495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,128,balanced,0.5238399902979533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,128,balanced,0.32977600892384845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,128,balanced,0.3522453308105469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,128,balanced,0.4646720091501872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,128,balanced,0.36128000418345135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,128,balanced,0.3866453170776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,128,balanced,0.3740319808324178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,128,power_law_1.01,0.5112063884735107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,128,balanced,0.05068266888459524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,128,power_law_1.01,0.5192959785461426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,128,power_law_1.01,0.5220160007476806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,128,balanced,0.8780426979064941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,128,balanced,0.05016533533732096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,128,balanced,0.3964213530222575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,128,power_law_1.01,0.3998528003692627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,128,balanced,0.05115200082461039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,128,power_law_1.01,0.4097919940948486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,128,balanced,0.05390933156013489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,128,power_law_1.01,0.4263807773590088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,128,balanced,0.054197331269582115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,128,power_law_1.01,0.44884481430053713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,128,balanced,0.06817600131034851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,128,balanced,0.07956799864768982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,128,power_law_1.01,0.4942336082458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,128,balanced,0.6898559729258219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,128,balanced,0.07938666641712189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,128,power_law_1.01,0.5116415977478027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,128,balanced,0.08019733428955078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,128,balanced,0.7135360240936279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,128,power_law_1.01,0.5081024169921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,128,balanced,0.08019733428955078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,128,power_law_1.01,0.46941437721252444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,128,balanced,0.08237866560618083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,128,power_law_1.01,0.4670207977294922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,128,balanced,0.0828000009059906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,128,power_law_1.01,0.4351679801940918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,128,balanced,0.08448533217112224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,128,power_law_1.01,0.48836479187011717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,128,balanced,0.08515200018882751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,128,balanced,0.731706698735555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,128,power_law_1.01,0.4796288013458252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,128,balanced,0.09081600109736125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,128,power_law_1.01,0.44039039611816405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,128,balanced,0.09248532851537068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,128,power_law_1.01,0.4752064228057861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,128,balanced,0.09577600161234538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,128,power_law_1.01,0.3950079917907715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,128,balanced,1.1633013089497883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,128,balanced,0.10517866412798564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,128,power_law_1.01,0.42266240119934084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,128,power_law_1.01,0.2965888023376465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,128,power_law_1.01,0.56528639793396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,128,power_law_1.01,0.3023360013961792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,128,power_law_1.01,0.693779182434082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,128,power_law_1.01,0.27127680778503416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,128,power_law_1.01,0.9294912338256835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,128,power_law_1.01,0.2072511911392212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,128,power_law_1.01,1.2270015716552733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,128,balanced,1.0693973700205486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,128,balanced,0.11455999811490376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,128,power_law_1.01,1.396288013458252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,128,power_law_1.01,0.2668735980987549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,128,power_law_1.01,1.8923328399658204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,128,power_law_1.01,0.25966720581054686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,128,power_law_1.01,0.256441593170166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,128,power_law_1.01,2.7209728240966795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,128,power_law_1.01,0.2828160047531128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,128,power_law_1.01,3.897203063964844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,128,balanced,1.5601174036661785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,128,power_law_1.01,0.25331840515136717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,128,power_law_1.01,4.553830337524414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,128,power_law_1.01,0.28866560459136964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,128,balanced,0.13274666666984558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,128,power_law_1.01,0.07516800165176392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,128,power_law_1.01,0.25617280006408694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,128,power_law_1.01,7.519046020507813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,128,power_law_1.01,0.28586881160736083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,128,power_law_1.01,0.0720255970954895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,128,balanced,0.14913599689801535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,128,balanced,1.3806346257527669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,128,power_law_1.01,13.966712951660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,128,power_law_1.01,0.26301438808441163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,128,power_law_1.01,0.07057279944419861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,128,power_law_1.01,0.27460479736328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,128,power_law_1.01,0.06405119895935059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,128,balanced,0.17896000544230142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,128,power_law_1.01,0.2801919937133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,128,power_law_1.01,0.06394240260124207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,128,power_law_1.01,0.2842688083648682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,128,power_law_1.01,0.06837120056152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,128,power_law_1.01,0.0775871992111206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,128,power_law_1.01,0.27537920475006106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,128,power_law_1.01,0.07624319791793824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,128,power_law_1.01,0.2560640096664429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,128,power_law_1.01,0.2815680027008057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,128,power_law_1.01,0.07445759773254394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,128,power_law_1.01,0.32138240337371826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,128,power_law_1.01,0.08004480004310607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,128,balanced,0.21463465690612793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,128,balanced,2.3167999585469565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,128,power_law_1.01,0.08122239708900451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,128,power_law_1.01,0.44620161056518554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,128,power_law_1.01,0.08319360017776489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,128,power_law_1.01,0.5461696147918701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,128,power_law_1.2,0.5116223812103271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,128,power_law_1.01,0.08691840171813965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,128,power_law_1.01,0.7054592132568359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,128,balanced,0.27268266677856445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,128,power_law_1.2,0.5061952114105225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,128,balanced,2.067567984263102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,128,power_law_1.01,0.9082240104675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,128,power_law_1.01,0.08934400081634522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,128,power_law_1.2,0.48929920196533205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,128,power_law_1.01,1.24072322845459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,128,power_law_1.2,0.2967871904373169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,128,power_law_1.01,0.10302079916000366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,128,power_law_1.2,0.33461120128631594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,128,power_law_1.01,0.10412160158157349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,128,power_law_1.2,0.45477118492126467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,128,power_law_1.2,0.3051455974578857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,128,power_law_1.01,1.6129472732543946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,128,power_law_1.2,0.4440447807312012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,128,power_law_1.01,0.11667840480804444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,128,power_law_1.2,0.27337601184844973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,128,power_law_1.01,2.223577690124512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,128,power_law_1.2,0.38172159194946287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,128,power_law_1.2,0.20849919319152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,128,power_law_1.01,0.14737279415130616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,128,balanced,0.3595999876658122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,128,power_law_1.01,2.872787284851074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,128,power_law_1.2,0.43649921417236326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,128,power_law_1.2,0.21953918933868408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,128,power_law_1.2,0.22291200160980223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,128,power_law_1.2,0.5079616069793701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,128,power_law_1.01,4.5369728088378904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,128,power_law_1.01,0.15765119791030885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,128,power_law_1.2,0.29431040287017823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,128,power_law_1.2,0.47002239227294923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,128,power_law_1.2,0.2896320104598999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,128,power_law_1.2,0.4381824016571045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,128,power_law_1.01,10.150592041015624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,128,power_law_1.2,0.2620543956756592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,128,balanced,0.4842666784922282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,128,power_law_1.2,0.47280001640319824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,128,power_law_1.01,0.17893760204315184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,128,power_law_1.2,0.25525119304656985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,128,power_law_1.2,0.47025279998779296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,128,power_law_1.01,0.2178368091583252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,128,power_law_1.2,0.28575360774993896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,128,power_law_1.2,0.4212224006652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,128,power_law_1.2,0.2873663902282715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,128,power_law_1.01,0.29282560348510744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,128,power_law_1.2,0.4446591854095459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,128,power_law_1.2,0.29524478912353513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,128,power_law_1.2,0.4653632164001465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,128,power_law_1.2,0.2612031936645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,128,power_law_1.2,0.40758399963378905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,128,power_law_1.01,0.33050880432128904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,128,balanced,0.6330560048421224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,128,power_law_1.2,0.2591871976852417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,128,power_law_1.2,0.5240320205688477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,128,power_law_1.01,0.4587200164794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,128,power_law_1.2,0.5489471912384033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,128,power_law_1.2,0.2553663969039917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,128,balanced,4.0141652425130205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,128,power_law_1.2,0.2252863883972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,128,power_law_1.2,0.6261184215545654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,128,power_law_1.01,0.6437759876251221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,128,power_law_1.2,0.30316801071166993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,128,power_law_1.2,0.7107071876525879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,128,power_law_1.01,0.9274815559387207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,128,power_law_1.2,0.3313920021057129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,128,balanced,3.8311360677083335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,128,power_law_1.2,1.0035391807556153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,128,power_law_1.01,1.2266624450683594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,128,power_law_1.2,0.40500478744506835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,128,power_law_1.2,1.246342372894287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,128,power_law_1.01,1.4773311614990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,128,power_law_1.2,0.5144000053405762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,128,balanced,0.7804373105367025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,128,power_law_1.2,1.7850112915039062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,128,power_law_1.2,0.6365056037902832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,128,power_law_1.2,2.281286430358887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,128,power_law_1.2,0.8253952026367187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,128,power_law_1.2,4.242240142822266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,128,power_law_1.2,1.1757247924804688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,128,power_law_1.01,2.7731775283813476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,128,power_law_1.2,1.5408063888549806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,128,power_law_1.2,5.261503982543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,128,power_law_1.01,5.051923370361328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,128,power_law_1.2,2.1398847579956053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,128,power_law_1.2,6.341088104248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,128,power_law_1.2,3.4855167388916017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,128,power_law_1.2,10.989075469970704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,128,power_law_1.2,3.721030426025391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,128,power_law_1.2,7.283251190185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,128,power_law_1.2,26.843377685546876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,128,balanced,1.2380906740824382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,128,power_law_1.2,16.421548461914064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,128,power_law_1.2,0.07334399819374085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,128,power_law_1.2,0.07264639735221863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,128,power_law_1.2,0.06910079717636108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,128,balanced,2.4026452700297036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,128,power_law_1.2,0.06428160071372986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,128,power_law_1.2,0.06474879980087281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,128,power_law_1.2,0.07096959948539734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,128,power_law_1.2,0.07407360076904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,128,power_law_1.2,0.07395200133323669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,128,power_law_1.2,0.07930880188941955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,128,power_law_1.2,0.08042880296707153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,128,power_law_1.2,0.07728000283241272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,128,power_law_1.2,0.08652799725532531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,128,power_law_1.2,0.08490239977836608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,128,power_law_1.2,0.09893760085105896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,128,power_law_1.2,0.10357120037078857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,128,power_law_1.2,0.11121280193328857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,128,power_law_1.2,0.1291264057159424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,128,power_law_1.2,0.1660863995552063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,64,balanced,0.11288000146547954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,128,power_law_1.2,0.19167360067367553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,64,balanced,0.11294933160146077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,64,balanced,0.11527466773986816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,64,balanced,0.11874666810035706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,128,power_law_1.2,0.20300159454345704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,64,balanced,0.20669333140055338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,64,balanced,0.3680906693140666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,128,power_law_1.2,0.26370561122894287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,64,balanced,0.5194400151570638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,128,power_law_1.2,0.3633343935012817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,64,balanced,0.5309493144353231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,64,balanced,0.5489333470662435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,64,balanced,0.5176533460617065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,128,power_law_1.2,0.4111167907714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,64,balanced,0.5309706528981527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,128,power_law_1.2,0.7404736042022705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,64,balanced,0.5228319962819418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,64,balanced,0.5692319869995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,64,balanced,0.5378133455912272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,128,power_law_1.2,0.8422080039978027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,64,balanced,0.5099200010299683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,128,power_law_1.2,1.3582079887390137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,64,balanced,0.5186613400777181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,128,power_law_1.2,1.6785408020019532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,64,balanced,0.5112320184707642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,128,power_law_1.2,2.363871955871582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,64,balanced,0.5075999895731608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,64,balanced,0.5097440083821615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,128,power_law_1.2,4.186227035522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,64,balanced,0.5086719989776611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,64,balanced,0.07706666489442189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,64,balanced,0.07810133198897044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,128,power_law_1.2,7.751033782958984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,64,balanced,0.5113653341929117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,64,balanced,0.07878399888674419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,64,balanced,0.08021333316961925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,64,balanced,0.4914026657740275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,64,balanced,0.1232373317082723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,64,balanced,0.21564799547195435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,64,balanced,0.2978079915046692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,64,balanced,0.4801439841588338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,64,balanced,0.3020640015602112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,64,balanced,0.31831467151641846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,64,balanced,0.3044000069300334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,64,balanced,0.30083733797073364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,64,balanced,0.4039253393809001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,64,balanced,0.2988746762275696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,64,balanced,0.2895573377609253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,64,power_law_1.01,0.5184703826904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,64,balanced,0.2903466622034709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,64,balanced,0.04493333399295807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,64,power_law_1.01,0.5031871795654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,64,balanced,0.30962133407592773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,64,balanced,0.9028586546579996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,64,balanced,0.04539200166861216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,64,power_law_1.01,0.5176959991455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,64,balanced,0.3223839998245239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,64,balanced,0.045466666420300804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,64,power_law_1.01,0.24407680034637452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,64,balanced,0.30959999561309814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,64,balanced,0.04869333406289419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,64,power_law_1.01,0.337446403503418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,64,balanced,0.3073333303133647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,64,balanced,0.05176533261934916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,64,power_law_1.01,0.40261120796203614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,64,balanced,0.06829866766929626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,64,balanced,0.31414933999379474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,64,power_law_1.01,0.3054464101791382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,64,balanced,0.07768533130486806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,64,power_law_1.01,0.44406399726867674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,64,balanced,0.7457333405812582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,64,balanced,0.3426400025685628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,64,balanced,0.07838400204976399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,64,power_law_1.01,0.3010688066482544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,64,power_law_1.01,0.4601856231689453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,64,balanced,0.0788213312625885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,64,power_law_1.01,0.29040639400482177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,64,balanced,0.35601067543029785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,64,power_law_1.01,0.4784895896911621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,64,balanced,0.07902400195598602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,64,power_law_1.01,0.1376960039138794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,64,balanced,0.08027199904123943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,64,power_law_1.01,0.07877119779586791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,64,power_law_1.01,0.45613441467285154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,64,power_law_1.01,0.1910272002220154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,64,balanced,0.08224533498287201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,64,balanced,0.36978665987650555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,64,power_law_1.01,0.07320320010185241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,64,power_law_1.01,0.46594557762145994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,64,power_law_1.01,0.22337279319763184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,64,balanced,0.08330666522185008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,64,power_law_1.01,0.07170559763908387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,64,power_law_1.01,0.48755202293395994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,64,power_law_1.01,0.2474047899246216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,64,balanced,0.08405333757400513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,64,power_law_1.01,0.058323198556900026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,64,balanced,0.39257065455118817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,64,balanced,1.2308106422424316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,64,power_law_1.01,0.0648576021194458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,64,balanced,0.09082133571306865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,64,power_law_1.01,0.2494976043701172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,64,power_law_1.01,0.451910400390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,64,power_law_1.01,0.06995840072631836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,64,balanced,0.09175999959309895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,64,power_law_1.01,0.27204480171203616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,64,power_law_1.01,0.5153920173645019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,64,power_law_1.01,0.06912000179290771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,64,balanced,0.09553600351015727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,64,power_law_1.01,0.28615679740905764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,64,power_law_1.01,0.07747200131416321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,64,power_law_1.01,0.47231359481811525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,64,balanced,0.4140533208847046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,64,power_law_1.01,0.07638400197029113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,64,balanced,0.10513066252072652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,64,power_law_1.01,0.2764159917831421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,64,power_law_1.01,0.48321919441223143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,64,power_law_1.01,0.07704960107803345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,64,power_law_1.01,0.29153919219970703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,64,power_law_1.01,0.48212480545043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,64,power_law_1.01,0.07836160063743591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,64,power_law_1.01,0.27457919120788576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,64,power_law_1.01,0.08131840229034423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,64,power_law_1.01,0.42106242179870607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,64,power_law_1.01,0.08637440204620361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,64,balanced,0.71943465868632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,64,power_law_1.01,0.2637439966201782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,64,power_law_1.01,0.466809606552124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,64,power_law_1.01,0.08849279880523682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,64,balanced,0.11572800079981486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,64,power_law_1.01,0.3026432037353516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,64,balanced,1.6754666964213054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,64,power_law_1.01,0.513478422164917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,64,power_law_1.01,0.10343040227890014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,64,power_law_1.01,0.10628479719161987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,64,power_law_1.01,0.2896064043045044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,64,power_law_1.01,0.606169605255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,64,power_law_1.01,0.11111680269241334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,64,power_law_1.01,0.274015998840332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,64,power_law_1.01,0.7389567852020263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,64,power_law_1.01,0.1353983998298645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,64,power_law_1.01,0.2853503942489624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,64,power_law_1.01,0.8736384391784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,64,balanced,0.7590239842732748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,64,power_law_1.01,0.2804863929748535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,64,power_law_1.01,0.16046080589294434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,64,power_law_1.01,1.283743953704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,64,power_law_1.2,0.522976016998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,64,balanced,0.1376106639703115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,64,power_law_1.01,0.34961280822753904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,64,power_law_1.01,1.4352191925048827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,64,power_law_1.2,0.5095551967620849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,64,power_law_1.01,0.3988991975784302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,64,power_law_1.01,0.17307519912719727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,64,balanced,0.1536853313446045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,64,power_law_1.01,2.0969024658203126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,64,power_law_1.2,0.5221951961517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,64,power_law_1.01,0.48263039588928225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,64,power_law_1.01,0.20495998859405518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,64,power_law_1.2,0.2495743989944458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,64,power_law_1.01,0.6126976013183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,64,power_law_1.01,2.6207231521606444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,64,power_law_1.01,0.2815615892410278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,64,balanced,0.18567466735839844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,64,power_law_1.2,0.28300158977508544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,64,power_law_1.01,0.8029567718505859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,64,power_law_1.01,3.3098304748535154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,64,balanced,1.1006240049997966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,64,power_law_1.2,0.4129216194152832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,64,power_law_1.01,1.1074496269226075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,64,power_law_1.2,0.29650559425354006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,64,balanced,2.411306699117025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,64,power_law_1.01,5.676287841796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,64,power_law_1.01,1.5651968002319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,64,power_law_1.2,0.4291327953338623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,64,power_law_1.01,1.9311103820800781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,64,power_law_1.2,0.3869119882583618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,64,power_law_1.01,11.734854125976563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,64,power_law_1.01,0.3172287940979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,64,balanced,0.22495466470718384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,64,power_law_1.01,2.4114688873291015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,64,power_law_1.2,0.46367998123168946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,64,power_law_1.01,0.4820608139038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,64,power_law_1.2,0.43451519012451173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,64,power_law_1.01,0.6289599895477295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,64,power_law_1.01,3.626995086669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,64,power_law_1.01,0.958944034576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,64,power_law_1.2,0.47674241065979006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,64,balanced,0.2874773343404134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,64,power_law_1.01,1.2254847526550292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,64,power_law_1.01,7.109196472167969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,64,power_law_1.2,0.43848319053649903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,64,balanced,1.441381295522054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,64,power_law_1.2,0.41726078987121584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,64,power_law_1.2,0.4985407829284668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,64,balanced,0.3801066478093465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,64,power_law_1.01,1.569702434539795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,64,power_law_1.2,0.46743040084838866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,64,power_law_1.2,0.4020671844482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,64,power_law_1.2,0.48250880241394045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,64,power_law_1.01,2.250265693664551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,64,power_law_1.2,0.5365632057189942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,64,balanced,0.5198293526967367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,64,power_law_1.2,0.6440383911132812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,64,power_law_1.01,4.4190528869628904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,64,power_law_1.2,0.7113344192504882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,64,power_law_1.2,0.915839958190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,64,power_law_1.2,1.049516773223877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,64,balanced,2.1590612729390464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,64,power_law_1.2,1.4041919708251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,64,power_law_1.2,1.7397504806518556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,64,balanced,0.6972106297810873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,64,power_law_1.2,2.8297727584838865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,64,balanced,4.243904113769531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,64,power_law_1.2,3.3673473358154298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,64,power_law_1.2,4.063148880004883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,64,power_law_1.2,8.192403411865234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,64,power_law_1.2,0.3086719989776611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,64,power_law_1.2,0.3029887914657593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,64,power_law_1.2,17.69366455078125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,64,power_law_1.2,0.27825920581817626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,64,power_law_1.2,0.135481595993042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,64,balanced,0.8592906792958578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,64,power_law_1.2,0.18097280263900756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,64,power_law_1.2,0.22761600017547606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,64,power_law_1.2,0.21056640148162842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,64,power_law_1.2,0.24365439414978027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,64,power_law_1.2,0.26512000560760496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,64,power_law_1.2,0.2307136058807373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,64,power_law_1.2,0.2432192087173462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,64,power_law_1.2,0.28538239002227783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,64,power_law_1.2,0.2822335958480835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,64,power_law_1.2,0.2598016023635864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,64,power_law_1.2,0.2517695903778076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,64,power_law_1.2,0.2632256031036377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,64,power_law_1.2,0.2831295967102051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,64,power_law_1.2,0.3030208110809326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,64,power_law_1.2,0.3051455974578857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,64,balanced,1.353493372599284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,64,balanced,4.053701400756836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,64,power_law_1.2,0.4299647808074951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,64,power_law_1.2,0.4499199867248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,64,power_law_1.2,0.6019775867462158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,64,power_law_1.2,0.6914303779602051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,64,power_law_1.2,1.054361629486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,64,power_law_1.2,1.3222271919250488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,64,power_law_1.2,1.8687936782836914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,64,power_law_1.2,2.462419128417969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,64,power_law_1.2,3.2082942962646483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,64,power_law_1.2,5.369440078735352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,64,power_law_1.2,11.497459411621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,64,balanced,2.636122703552246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,64,power_law_1.2,0.07856640219688416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,64,power_law_1.2,0.07378559708595275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,32,balanced,0.08803199728329976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,64,power_law_1.2,0.07155839800834655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,32,balanced,0.08557867010434468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,64,power_law_1.2,0.058156800270080564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,32,balanced,0.08684266606966655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,64,power_law_1.2,0.06104320287704468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,32,balanced,0.11931199828783672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,64,power_law_1.2,0.06940159797668458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,32,balanced,0.20368534326553345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,64,power_law_1.2,0.06812160015106201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,32,balanced,0.35280001163482666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,64,power_law_1.2,0.07701759934425353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,32,balanced,0.5100906689961752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,32,balanced,0.06578133503595988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,64,power_law_1.2,0.07637760043144226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,32,balanced,0.5221920013427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,64,power_law_1.2,0.07816960215568543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,32,balanced,0.06243733565012614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,32,balanced,0.5199840068817139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,32,balanced,0.0728000005086263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,64,power_law_1.2,0.08095999956130981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,32,balanced,0.5369333426157633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,32,balanced,0.0825493335723877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,64,power_law_1.2,0.08271999955177307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,32,balanced,0.5348000129063925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,32,balanced,0.13014933466911316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,32,balanced,0.5141919851303101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,64,power_law_1.2,0.08372480273246766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,32,balanced,0.21727466583251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,32,balanced,0.5235679944356283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,64,power_law_1.2,0.0932416021823883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,32,balanced,0.3057066599527995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,32,balanced,0.5138773520787557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,64,power_law_1.2,0.104038405418396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,32,balanced,0.31193600098292035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,32,balanced,0.5086986621220907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,64,power_law_1.2,0.1062656044960022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,32,balanced,0.2972053289413452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,32,balanced,0.5143839915593466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,64,power_law_1.2,0.11340800523757935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,32,balanced,0.31145066022872925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,32,balanced,0.47304534912109375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,64,power_law_1.2,0.1512063980102539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,32,balanced,0.2997866670290629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,32,balanced,0.04523199796676636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,32,balanced,0.5111039876937866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,32,balanced,0.31143466631571454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,32,balanced,0.04573333263397217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,32,balanced,0.3162986636161804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,64,power_law_1.2,0.17583359479904176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,32,balanced,0.5057546695073446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,32,balanced,0.04586133360862732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,32,power_law_1.01,0.35674879550933836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,32,balanced,0.31752532720565796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,32,balanced,0.5142240126927694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,32,balanced,0.049695998430252075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,32,balanced,0.3068266709645589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,32,power_law_1.01,0.5070464134216308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,64,power_law_1.2,0.19839999675750733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,32,balanced,0.05638400216897329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,32,balanced,0.3165973424911499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,32,balanced,0.06894400219122569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,32,balanced,0.48662400245666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,64,power_law_1.2,0.24197120666503907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,32,power_law_1.01,0.5462016105651856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,32,balanced,0.08108266691366832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,32,balanced,0.3184960087140401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,64,power_law_1.2,0.3129535913467407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,32,power_law_1.01,0.1955839991569519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,32,balanced,0.08303466439247131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,32,balanced,0.32266666491826373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,32,power_law_1.01,0.2790911912918091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,32,balanced,0.5054826736450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,32,balanced,0.08364799618721008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,32,power_law_1.01,0.31619839668273925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,32,balanced,0.31036800146102905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,32,balanced,0.0836906631787618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,64,power_law_1.2,0.38419198989868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,32,balanced,0.4809173345565796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,32,power_law_1.01,0.39146239757537843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,32,balanced,0.08460799853006999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,64,power_law_1.2,0.5702271938323975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,32,balanced,0.3327626585960388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,32,balanced,0.08620267113049825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,32,power_law_1.01,0.3998016119003296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,64,power_law_1.2,0.8231807708740234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,32,balanced,0.08803733189900716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,32,balanced,0.35155733426411945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,32,power_law_1.01,0.39200639724731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,64,power_law_1.2,1.2110527992248534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,32,balanced,0.08912000060081482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,32,balanced,0.42962666352589923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,32,power_law_1.01,0.4522047996520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,32,balanced,0.09545066952705383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,64,power_law_1.2,1.7037376403808593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,32,balanced,0.37907731533050537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,32,power_law_1.01,0.4525887966156006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,32,power_law_1.01,0.224236798286438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,32,balanced,0.09706667065620422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,32,power_law_1.01,0.5038847923278809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,32,balanced,0.10149332880973816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,32,power_law_1.01,0.3228863954544067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,64,power_law_1.2,2.026950454711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,32,balanced,0.953717311223348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,32,balanced,0.39236267407735187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,32,power_law_1.01,0.4166912078857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,32,balanced,0.11326932907104492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,32,power_law_1.01,0.312825608253479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,32,power_law_1.01,0.431660795211792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,32,power_law_1.01,0.12448639869689941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,64,power_law_1.2,3.8237438201904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,32,power_law_1.01,0.4663871765136719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,32,power_law_1.01,0.14034559726715087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,32,balanced,0.43729066848754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,32,power_law_1.01,0.45172481536865233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,64,power_law_1.2,7.862745666503907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,32,power_law_1.01,0.19987839460372925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,32,balanced,0.12526399890581766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,32,power_law_1.01,0.4493055820465088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,32,power_law_1.01,0.2386240005493164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,32,balanced,0.8047733306884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,32,power_law_1.01,0.44263038635253904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,32,power_law_1.01,0.23525118827819824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,32,balanced,0.7438933054606119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,32,power_law_1.01,0.2355072021484375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,32,power_law_1.01,0.5094592094421386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,32,power_law_1.01,0.2719487905502319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,32,power_law_1.01,0.5584703922271729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,32,power_law_1.01,0.2657984018325806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,32,power_law_1.01,0.604204797744751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,32,balanced,0.1479680041472117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,32,power_law_1.01,0.2761663913726807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,32,power_law_1.01,0.7146944046020508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,32,balanced,0.16856000820795694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,32,balanced,1.2937013308207195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,32,balanced,0.8153546651204427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,32,power_law_1.01,0.27891199588775634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,32,power_law_1.01,0.8141247749328613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,32,power_law_1.01,0.2729919910430908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,32,balanced,0.2062079906463623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,32,power_law_1.01,1.066483211517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,32,power_law_1.01,0.2685823917388916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,32,power_law_1.01,1.3722368240356446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,32,power_law_1.01,0.28894720077514646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,32,power_law_1.01,0.07185279726982116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,32,power_law_1.01,1.7588863372802734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,32,power_law_1.01,0.2837951898574829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,32,power_law_1.01,2.1701568603515624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,32,power_law_1.01,0.08026880025863647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,32,power_law_1.01,0.29462399482727053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,32,power_law_1.01,0.07652480006217957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,32,power_law_1.2,0.3537087917327881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,32,balanced,1.1603466669718425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,32,power_law_1.01,0.3307775974273682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,32,power_law_1.01,2.8625471115112306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,32,balanced,0.2513759930928548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,32,power_law_1.01,0.05744640231132507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,32,power_law_1.01,0.3508095979690552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,32,power_law_1.2,0.505785608291626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,32,balanced,1.7376480102539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,32,power_law_1.01,4.7384193420410154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,32,power_law_1.01,0.06139519810676575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,32,power_law_1.01,0.4161983966827393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,32,power_law_1.2,0.4192255973815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,32,power_law_1.01,0.06561279892921448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,32,power_law_1.2,0.1776703953742981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,32,power_law_1.01,0.4902912139892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,32,power_law_1.01,8.99849624633789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,32,balanced,0.3281173308690389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,32,power_law_1.01,0.06964480280876159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,32,power_law_1.2,0.24956159591674804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,32,power_law_1.01,0.6185535907745361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,32,power_law_1.2,0.32254719734191895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,32,power_law_1.01,0.07697280049324036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,32,power_law_1.01,0.7788479804992676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,32,power_law_1.01,0.07956479787826538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,32,power_law_1.2,0.33331201076507566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,32,power_law_1.01,0.9846655845642089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,32,balanced,1.5148159662882488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,32,power_law_1.01,0.07815679907798767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,32,power_law_1.2,0.42152957916259765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,32,power_law_1.01,1.3654975891113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,32,balanced,0.4533013502756755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,32,power_law_1.01,0.07938560247421264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,32,power_law_1.2,0.4042623996734619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,32,power_law_1.01,1.673299217224121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,32,power_law_1.2,0.43108482360839845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,32,power_law_1.01,0.08394880294799804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,32,power_law_1.01,2.174995231628418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,32,power_law_1.2,0.4082816123962402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,32,power_law_1.01,0.08517119884490967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,32,power_law_1.2,0.4477375984191895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,32,power_law_1.01,3.457734298706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,32,power_law_1.01,0.09031040072441102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,32,balanced,2.575541337331136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,32,power_law_1.2,0.41861758232116697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,32,balanced,0.6313440004984537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,32,power_law_1.01,0.09574400186538697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,32,power_law_1.2,0.41139841079711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,32,power_law_1.01,6.563053131103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,32,power_law_1.01,0.10696959495544434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,32,power_law_1.2,0.46681599617004393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,32,power_law_1.01,0.1170240044593811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,32,power_law_1.2,0.4528831958770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,32,power_law_1.01,0.13591040372848512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,32,power_law_1.2,0.43888001441955565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,32,power_law_1.2,0.48156161308288575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,32,balanced,2.290010611216227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,32,power_law_1.01,0.14871679544448851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,32,balanced,0.8418400287628174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,32,power_law_1.2,0.4791872024536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,32,power_law_1.2,0.5656960010528564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,32,power_law_1.01,0.18190079927444458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,32,power_law_1.2,0.6780159950256348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,32,power_law_1.01,0.22410240173339843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,32,power_law_1.2,0.8075391769409179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,32,power_law_1.01,0.3080384016036987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,32,power_law_1.2,0.9665280342102051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,32,power_law_1.2,1.2550911903381348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,32,power_law_1.2,1.7670463562011718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,32,power_law_1.01,0.38623359203338625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,32,balanced,1.0275306701660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,32,power_law_1.2,2.391865539550781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,32,power_law_1.01,0.5386688232421875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,32,power_law_1.2,3.248108673095703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,32,power_law_1.01,0.6798399925231934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,32,power_law_1.2,3.5210239410400392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,32,power_law_1.01,0.9343999862670899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,32,power_law_1.2,5.558483123779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,32,power_law_1.01,1.3242560386657716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,32,power_law_1.01,1.5805824279785157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,32,power_law_1.2,13.784614562988281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,32,balanced,4.54590384165446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,32,power_law_1.01,2.4710720062255858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,32,power_law_1.01,4.688902282714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,32,balanced,1.6131466229756672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,32,balanced,4.310256004333496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,32,power_law_1.2,0.22257280349731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,32,power_law_1.2,0.31368958950042725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,32,power_law_1.2,0.2643712043762207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,32,power_law_1.2,0.10913920402526855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,32,power_law_1.2,0.16392960548400878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,32,power_law_1.2,0.18642560243606568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,32,power_law_1.2,0.18709759712219237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,32,power_law_1.2,0.26225919723510743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,32,power_law_1.2,0.20936961174011232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,32,balanced,3.146373430887858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,32,power_law_1.2,0.23304319381713867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,32,power_law_1.2,0.2877824068069458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,32,power_law_1.2,0.2686912059783936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,32,power_law_1.2,0.24074239730834962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,32,power_law_1.2,0.26940159797668456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,32,power_law_1.2,0.23947520256042482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,32,power_law_1.2,0.27511680126190186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,32,power_law_1.2,0.2689536094665527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,32,power_law_1.2,0.3001471996307373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,32,power_law_1.2,0.3247231960296631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,32,power_law_1.2,0.38728320598602295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,32,power_law_1.2,0.07023360133171082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,32,power_law_1.2,0.4676544189453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,32,power_law_1.2,0.08024960160255432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,32,power_law_1.2,0.5748735904693604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,32,power_law_1.2,0.056959998607635495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,32,power_law_1.2,0.6723008155822754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,32,power_law_1.2,0.0562175989151001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,32,power_law_1.2,0.9460288047790527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,32,power_law_1.2,0.060652798414230345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,32,power_law_1.2,1.1903615951538087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,32,power_law_1.2,0.06599680185317994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,32,power_law_1.2,0.06936960220336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,32,power_law_1.2,1.7273792266845702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,32,power_law_1.2,0.07589120268821717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,32,power_law_1.2,2.0617279052734374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,32,power_law_1.2,0.0759168028831482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,32,power_law_1.2,2.719219207763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,16,balanced,0.055306668082873024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,32,power_law_1.2,0.07652480006217957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,16,balanced,0.05584533512592316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,32,power_law_1.2,0.07692800164222717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,32,power_law_1.2,4.02935676574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,16,balanced,0.05522666871547699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,32,power_law_1.2,0.08267520070075988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,16,balanced,0.06163733204205831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,32,power_law_1.2,8.154412841796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,32,power_law_1.2,0.08257279992103576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,16,balanced,0.072202667593956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,16,balanced,0.09053333600362141
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,32,power_law_1.2,0.08711680173873901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,16,balanced,0.11238400141398112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,32,power_law_1.2,0.10554879903793335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,16,balanced,0.11506666739781697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,16,balanced,0.11430933078130086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,32,power_law_1.2,0.10905599594116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,16,balanced,0.11372266213099162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,32,power_law_1.2,0.12847360372543334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,16,balanced,0.11617066462834676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,32,power_law_1.2,0.15944960117340087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,16,balanced,0.1179146667321523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,16,balanced,0.11821333567301433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,32,power_law_1.2,0.15964800119400024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,16,balanced,0.12045333782831828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,16,balanced,0.12613866726557413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,16,balanced,0.12804800271987915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,32,power_law_1.2,0.18835840225219727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,16,balanced,0.1311253309249878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,32,power_law_1.2,0.24576640129089355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,16,balanced,0.14175466696421304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,16,balanced,0.15051199992497763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,32,power_law_1.2,0.3449343919754028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,16,balanced,0.17058134078979492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,32,power_law_1.2,0.44261760711669923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,16,balanced,0.1926400065422058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,16,balanced,0.04762666424115499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,32,power_law_1.2,0.6235072135925293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,16,balanced,0.048725331823031105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,16,balanced,0.048570667703946434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,16,balanced,0.2307200034459432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,16,balanced,0.05420800050099691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,32,power_law_1.2,0.7739136219024658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,16,balanced,0.059845333298047386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,32,power_law_1.2,1.1828927993774414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,16,balanced,0.07387733459472656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,16,balanced,0.2682346701622009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,16,balanced,0.08753599723180135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,32,power_law_1.2,1.6433408737182618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,16,balanced,0.0883893370628357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,16,balanced,0.0893440047899882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,32,power_law_1.2,1.9832576751708983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,16,balanced,0.046800002455711365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,16,balanced,0.09038399656613667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,16,balanced,0.32578132549921673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,16,power_law_1.01,0.07927680015563965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,16,balanced,0.047685335079828896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,16,balanced,0.09171199798583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,16,power_law_1.01,0.08769919872283935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,32,power_law_1.2,3.364217758178711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,16,balanced,0.09377599755922954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,16,balanced,0.049141332507133484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,16,power_law_1.01,0.06602240204811097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,16,power_law_1.01,0.10241279602050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,16,balanced,0.09616532921791077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,16,balanced,0.054229333996772766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,16,power_law_1.01,0.0689087986946106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,16,power_law_1.01,0.06704639792442321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,16,balanced,0.41606398423512775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,32,power_law_1.2,7.389177703857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,16,balanced,0.061664000153541565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,16,balanced,0.09752532839775085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,16,power_law_1.01,0.07886080145835876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,16,power_law_1.01,0.07082880139350892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,16,balanced,0.07396266857783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,16,balanced,0.103685329357783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,16,power_law_1.01,0.08081920146942138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,16,power_law_1.01,0.057062399387359616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,16,balanced,0.08944533268610637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,16,balanced,0.10619200269381206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,16,power_law_1.01,0.0855296015739441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,16,balanced,0.09090133508046468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,16,power_law_1.01,0.062009602785110474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,16,balanced,0.11104533076286316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,16,balanced,0.0916319986184438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,16,power_law_1.01,0.09310719966888428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,16,power_law_1.01,0.06706560254096985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,16,balanced,0.12450133760770161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,16,balanced,0.5531839927037557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,16,balanced,0.091648002465566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,16,power_law_1.01,0.09816319942474365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,16,power_law_1.01,0.06993920207023621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,16,balanced,0.13740266362826029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,16,balanced,0.0937493344148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,16,power_law_1.01,0.09938560128211975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,16,power_law_1.01,0.07749119997024537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,16,balanced,0.16332266728083292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,16,balanced,0.09549867113431294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,16,power_law_1.01,0.10153599977493286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,16,power_law_1.01,0.07836160063743591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,16,balanced,0.09736532966295879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,16,power_law_1.01,0.10514559745788574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,16,balanced,0.19113600254058838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,16,power_law_1.01,0.07939199805259704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,16,balanced,0.0995306670665741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,16,power_law_1.01,0.10117759704589843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,16,power_law_1.01,0.08234239816665649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,16,balanced,0.10600533088048299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,16,power_law_1.01,0.10911999940872193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,16,balanced,0.24030399322509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,16,power_law_1.01,0.08381440043449402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,16,balanced,0.7392000357309977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,16,balanced,0.10884799559911092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,16,power_law_1.01,0.1173632025718689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,16,power_law_1.01,0.08509439826011658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,16,balanced,0.11522666613260905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,16,power_law_1.01,0.11967999935150146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,16,balanced,0.2858293255170186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,16,power_law_1.01,0.09091839790344239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,16,power_law_1.01,0.12833280563354493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,16,balanced,0.1288586656252543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,16,power_law_1.01,0.10021760463714599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,16,power_law_1.01,0.14284160137176513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,16,balanced,0.3773599863052368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,16,power_law_1.01,0.10417280197143555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,16,power_law_1.01,0.1585088014602661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,16,power_law_1.01,0.20655360221862792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,16,power_law_1.01,0.11247999668121338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,16,power_law_1.01,0.06370559930801392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,16,balanced,0.1471946636835734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,16,power_law_1.01,0.13238400220870972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,16,power_law_1.01,0.23342719078063964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,16,power_law_1.01,0.0762880027294159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,16,power_law_1.01,0.2684288024902344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,16,power_law_1.01,0.15267839431762695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,16,power_law_1.01,0.08822399973869324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,16,balanced,0.9168639977773031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,16,balanced,0.4846133391062419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,16,power_law_1.01,0.3475519895553589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,16,power_law_1.01,0.1862015962600708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,16,power_law_1.01,0.05807999968528747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,16,power_law_1.01,0.06544640064239501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,16,power_law_1.01,0.42508797645568847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,16,power_law_1.01,0.21479039192199706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,16,power_law_1.01,0.06999679803848266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,16,power_law_1.01,0.5362751960754395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,16,power_law_1.01,0.27450881004333494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,16,power_law_1.01,0.0735871970653534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,16,balanced,0.1759200096130371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,16,power_law_1.01,0.744268798828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,16,power_law_1.01,0.33740160465240476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,16,power_law_1.01,0.08058879971504211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,16,power_law_1.01,0.4383103847503662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,16,power_law_1.01,0.08069760203361512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,16,power_law_1.01,0.9573375701904296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,16,balanced,0.20232532421747842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,16,power_law_1.01,0.08327040076255798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,16,balanced,0.6790826320648193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,16,power_law_1.01,0.5898623943328858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,16,power_law_1.01,1.2229567527770997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,16,power_law_1.01,0.08734080195426941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,16,power_law_1.01,0.7819968223571777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,16,balanced,0.2510880033175151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,16,power_law_1.01,0.09157119989395142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,16,power_law_1.01,1.8519424438476562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,16,power_law_1.01,1.0423808097839355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,16,power_law_1.01,0.09064319729804993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,16,power_law_1.01,0.10161919593811035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,16,power_law_1.01,3.265625762939453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,16,power_law_1.01,1.2758336067199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,16,power_law_1.01,0.10968320369720459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,16,power_law_1.01,0.11477760076522828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,16,power_law_1.01,1.952390480041504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,16,power_law_1.01,0.13570560216903688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,16,balanced,1.347376028696696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,16,power_law_1.01,0.16209280490875244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,16,power_law_1.01,3.9652481079101562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,16,balanced,0.890725294748942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,16,balanced,0.3244853417078654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,16,power_law_1.01,0.18263039588928223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,16,balanced,0.4395466645558675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,16,power_law_1.01,0.2156735897064209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,16,power_law_1.01,0.2542207956314087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,16,power_law_1.01,0.36241281032562256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,16,balanced,0.6107893387476603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,16,balanced,1.0994773705800374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,16,power_law_1.01,0.42189440727233884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,16,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,16,power_law_1.01,0.6225152015686035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,16,power_law_1.2,0.08872320055961609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,16,power_law_1.01,0.8760128021240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,16,power_law_1.2,0.07845759987831116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,16,power_law_1.01,1.1713664054870605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,16,power_law_1.2,0.0664896011352539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,16,balanced,0.8391626675923666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,16,power_law_1.2,0.07071359753608704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,16,power_law_1.01,1.5564031600952148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,16,power_law_1.2,0.0781503975391388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,16,power_law_1.01,1.9111551284790038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,16,power_law_1.2,0.08316799998283386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,16,power_law_1.01,3.428435134887695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,16,power_law_1.2,0.09408000111579895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,16,power_law_1.01,6.323769760131836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,16,power_law_1.2,0.09559680223464966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,16,power_law_1.2,0.09681280255317688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,16,power_law_1.2,0.09981439709663391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,16,balanced,1.1081653436024983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,16,power_law_1.2,0.1034816026687622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,16,balanced,1.6917600631713867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,16,power_law_1.2,0.10548479557037353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,16,power_law_1.2,0.10569599866867066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,16,power_law_1.2,0.11849600076675415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,16,balanced,2.5300532976786294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,16,power_law_1.2,0.1202623963356018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,16,power_law_1.2,0.13139840364456176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,16,power_law_1.2,0.14914560317993164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,16,balanced,1.363200028737386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,16,power_law_1.2,0.164518404006958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,16,power_law_1.2,0.21056640148162842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,16,power_law_1.2,0.23688960075378418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,16,power_law_1.2,0.2913088083267212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,16,power_law_1.2,0.37918078899383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,16,power_law_1.2,0.5234240055084228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,16,power_law_1.2,0.5919616222381592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,16,power_law_1.2,0.06364160180091857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,16,power_law_1.2,0.7599552154541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,16,power_law_1.2,0.0747327983379364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,16,power_law_1.2,1.180128002166748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,16,power_law_1.2,0.06691200137138367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,16,power_law_1.2,1.3412480354309082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,16,power_law_1.2,0.05631359815597534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,16,power_law_1.2,0.06098560094833374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,16,balanced,2.133375962575277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,16,power_law_1.2,2.3781951904296874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,16,power_law_1.2,0.06534399986267089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,16,power_law_1.2,0.07046399712562561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,16,power_law_1.2,0.07418879866600037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,16,power_law_1.2,4.176403045654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,16,power_law_1.2,0.07777919769287109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,16,balanced,3.2560160954793296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,16,power_law_1.2,0.078438401222229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,16,power_law_1.2,0.08122239708900451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,16,power_law_1.2,0.08583679795265198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,16,power_law_1.2,0.08715519905090333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,16,power_law_1.2,0.09228799939155578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,16,power_law_1.2,0.10057599544525146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,16,power_law_1.2,0.1102720022201538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,16,power_law_1.2,0.11349120140075683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,16,power_law_1.2,0.1325503945350647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,16,power_law_1.2,0.15790079832077025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,16,power_law_1.2,0.19867520332336425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,16,power_law_1.2,0.2251584053039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,16,power_law_1.2,0.2961344003677368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,16,power_law_1.2,0.343667197227478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,16,power_law_1.2,0.48496642112731936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,16,power_law_1.2,0.6239552021026611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,16,power_law_1.2,0.8766207695007324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,16,power_law_1.2,1.159596824645996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,16,power_law_1.2,1.4552063941955566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,16,power_law_1.2,2.430284881591797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,16,power_law_1.2,4.8083648681640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,16,balanced,4.181722640991211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,8,balanced,0.05625600119431814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,8,balanced,0.05560000240802765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,16,power_law_1.2,0.06244480013847351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,8,balanced,0.05736533304055532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,8,balanced,0.06412266691525777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,16,power_law_1.2,0.07607679963111877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,8,balanced,0.07549866537253062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,16,power_law_1.2,0.06417279839515685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,8,balanced,0.09784533580144246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,16,power_law_1.2,0.05983359813690185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,8,balanced,0.12298666437466939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,16,power_law_1.2,0.06327040195465088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,8,balanced,0.12352533141771953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,8,balanced,0.12314666310946147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,16,power_law_1.2,0.07041919827461243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,8,balanced,0.12545067071914673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,16,power_law_1.2,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,8,balanced,0.12763733665148416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,16,power_law_1.2,0.08204159736633301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,8,balanced,0.1286186675230662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,16,power_law_1.2,0.08387839794158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,8,balanced,0.12894933422406515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,16,power_law_1.2,0.08282880187034607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,8,balanced,0.13236799836158752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,8,balanced,0.14006933569908142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,16,power_law_1.2,0.08501759767532349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,16,power_law_1.2,0.09509119987487794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,8,balanced,0.14177067081133524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,16,power_law_1.2,0.0941760003566742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,8,balanced,0.1467680037021637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,16,power_law_1.2,0.10005760192871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,8,balanced,0.1602773368358612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,8,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,16,power_law_1.2,0.1119871973991394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,8,balanced,0.17170133193333945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,8,balanced,0.04913066824277242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,16,power_law_1.2,0.12579840421676636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,8,balanced,0.05029866596062978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,8,balanced,0.19829867283503214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,16,power_law_1.2,0.13504639863967896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,8,balanced,0.05570133527119955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,8,balanced,0.06447466711203258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,16,power_law_1.2,0.17761919498443604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,8,balanced,0.22141865889231363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,8,balanced,0.08276799817879994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,8,balanced,0.09809066851933797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,8,balanced,0.259770671526591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,16,power_law_1.2,0.18664319515228273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,8,balanced,0.09992532928784688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,8,balanced,0.10010666648546855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,8,balanced,0.10125866532325745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,8,balanced,0.30762133995691937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,8,balanced,0.10386133193969727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,16,power_law_1.2,0.21497600078582763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,8,balanced,0.10486400127410889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,16,power_law_1.2,0.2815295934677124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,8,balanced,0.10705066720644633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,16,power_law_1.2,0.39590399265289306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,8,balanced,0.10831466317176819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,8,balanced,0.40135467052459717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,8,balanced,0.05092266698678335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,8,balanced,0.11774399876594543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,8,balanced,0.054570664962132774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,8,balanced,0.12012799580891927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,16,power_law_1.2,0.48126721382141113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,8,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,8,balanced,0.12589333454767862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,16,power_law_1.2,0.7226687908172608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,8,balanced,0.06283199787139893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,8,balanced,0.5153493483861288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,8,balanced,0.14332800110181174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,8,balanced,0.07320000231266022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,16,power_law_1.2,0.9563839912414551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,8,balanced,0.08989866574605306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,8,balanced,0.1593546668688456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,16,power_law_1.2,1.4231488227844238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,8,balanced,0.1070186694463094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,8,balanced,0.10820800065994263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,8,balanced,0.18872000773747763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,16,power_law_1.2,1.7214080810546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,8,balanced,0.11036266883214314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,8,balanced,0.11145599683125813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,16,power_law_1.2,2.1569984436035154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,8,balanced,0.7061386903127035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,8,balanced,0.22166933616002402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,8,balanced,0.11358400185902913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,16,power_law_1.2,4.101030349731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,8,balanced,0.11580800016721089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,8,balanced,0.27529066801071167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,8,balanced,0.11948266625404358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,8,balanced,0.12266666690508525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,16,power_law_1.2,7.624639892578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,8,balanced,0.13223466277122498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,8,balanced,0.33192533254623413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,8,balanced,0.1355839967727661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,8,power_law_1.01,0.061382400989532473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,8,balanced,0.14646933476130167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,8,balanced,0.9284319877624512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,8,power_law_1.01,0.07882239818572997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,8,balanced,0.16366933782895407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,8,balanced,0.4489920139312744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,8,power_law_1.01,0.05189120173454285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,8,power_law_1.01,0.10299520492553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,8,power_law_1.01,0.06301440000534057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,8,power_law_1.01,0.06579840183258057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,8,power_law_1.01,0.07483519911766053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,8,power_law_1.01,0.07028480172157288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,8,balanced,0.5816053152084351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,8,power_law_1.01,0.05777919888496399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,8,power_law_1.01,0.08429440259933471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,8,balanced,0.1885333259900411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,8,power_law_1.01,0.06321920156478882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,8,power_law_1.01,0.08650239706039428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,8,power_law_1.01,0.09574400186538697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,8,power_law_1.01,0.06991360187530518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,8,balanced,1.1261173089345295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,8,power_law_1.01,0.10088319778442383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,8,power_law_1.01,0.0749504029750824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,8,power_law_1.01,0.08432000279426574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,8,power_law_1.01,0.0998528003692627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,8,balanced,0.8250880241394043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,8,balanced,0.2465440034866333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,8,power_law_1.01,0.10833280086517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,8,power_law_1.01,0.0850495994091034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,8,power_law_1.01,0.11240960359573364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,8,power_law_1.01,0.08984320163726807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,8,balanced,0.2949120004971822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,8,power_law_1.01,0.11499520540237426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,8,power_law_1.01,0.0899839997291565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,8,power_law_1.01,0.1229248046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,8,power_law_1.01,0.0943615972995758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,8,balanced,0.37462401390075684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,8,power_law_1.01,0.09631999731063842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,8,power_law_1.01,0.1273151993751526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,8,power_law_1.01,0.10362240076065063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,8,power_law_1.01,0.13765759468078614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,8,balanced,0.49017600218455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,8,balanced,1.075482686360677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,8,power_law_1.01,0.11294080018997192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,8,power_law_1.01,0.13925119638442993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,8,power_law_1.01,0.06392959952354431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,8,power_law_1.01,0.12242560386657715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,8,power_law_1.01,0.16132479906082153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,8,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,8,power_law_1.01,0.1325055956840515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,8,power_law_1.01,0.18373119831085205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,8,balanced,0.6472320159276327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,8,power_law_1.01,0.0720192015171051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,8,balanced,1.712000052134196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,8,power_law_1.2,0.07857279777526856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,8,power_law_1.01,0.15178240537643434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,8,power_law_1.01,0.2151103973388672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,8,power_law_1.01,0.09114239811897278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,8,power_law_1.2,0.06796799898147583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,8,power_law_1.01,0.06710399985313416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,8,power_law_1.01,0.17074559926986693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,8,power_law_1.01,0.25182080268859863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,8,power_law_1.2,0.06585599780082703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,8,power_law_1.01,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,8,power_law_1.01,0.20905599594116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,8,balanced,0.8911146322886149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,8,power_law_1.01,0.3072448015213013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,8,power_law_1.2,0.07157120108604431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,8,balanced,1.3237439791361492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,8,power_law_1.01,0.07991679906845092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,8,power_law_1.01,0.2410111904144287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,8,power_law_1.2,0.08042880296707153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,8,power_law_1.01,0.37367680072784426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,8,power_law_1.01,0.08921599984169007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,8,power_law_1.01,0.31169281005859373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,8,power_law_1.2,0.08229119777679443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,8,power_law_1.01,0.4805823802947998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,8,power_law_1.01,0.0967423975467682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,8,power_law_1.01,0.38226559162139895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,8,power_law_1.2,0.09916800260543823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,8,power_law_1.01,0.6297344207763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,8,power_law_1.01,0.09859840273857116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,8,power_law_1.01,0.5159359931945801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,8,power_law_1.2,0.09807360172271729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,8,balanced,1.2248160044352214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,8,power_law_1.01,0.1021888017654419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,8,power_law_1.01,0.8690431594848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,8,power_law_1.01,0.6875264167785644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,8,power_law_1.2,0.10069119930267334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,8,power_law_1.01,0.10588159561157226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,8,power_law_1.01,1.0752063751220704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,8,power_law_1.2,0.10449919700622559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,8,power_law_1.01,0.9231231689453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,8,power_law_1.01,0.11180800199508667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,8,power_law_1.2,0.11122560501098633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,8,power_law_1.01,1.2495231628417969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,8,power_law_1.01,1.3105279922485351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,8,power_law_1.01,0.11523840427398682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,8,power_law_1.2,0.11102720499038696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,8,power_law_1.01,1.5131135940551759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,8,power_law_1.01,0.12324479818344117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,8,power_law_1.01,2.078835105895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,8,power_law_1.2,0.12079360485076904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,8,power_law_1.01,0.13654400110244752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,8,power_law_1.01,2.414374351501465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,8,power_law_1.2,0.13355519771575927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,8,balanced,1.6477440198262532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,8,power_law_1.01,4.276953506469726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,8,power_law_1.01,0.14282239675521852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,8,power_law_1.2,0.13694080114364623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,8,balanced,2.055295944213867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,8,power_law_1.01,4.833740615844727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,8,power_law_1.01,0.168614399433136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,8,power_law_1.2,0.14552320241928102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,8,power_law_1.01,0.19900799989700318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,8,power_law_1.2,0.1643839955329895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,8,power_law_1.2,0.18531839847564696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,8,power_law_1.2,0.2341439962387085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,8,power_law_1.01,0.2321216106414795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,8,power_law_1.2,0.2565696001052856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,8,power_law_1.2,0.32035839557647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,8,power_law_1.01,0.2808063983917236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,8,balanced,2.0351999600728354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,8,balanced,3.277189254760742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,8,power_law_1.2,0.39527039527893065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,8,power_law_1.01,0.3665343999862671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,8,power_law_1.2,0.5490880012512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,8,power_law_1.01,0.4670976161956787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,8,power_law_1.2,0.7023935794830323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,8,power_law_1.01,0.5929088115692138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,8,power_law_1.2,0.9356287956237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,8,power_law_1.01,0.9257087707519531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,8,power_law_1.2,1.16048002243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,8,power_law_1.01,1.0843520164489746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,8,power_law_1.2,1.3965120315551758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,8,power_law_1.01,1.6550975799560548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,8,power_law_1.2,2.5668991088867186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,8,power_law_1.01,2.064748764038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,8,power_law_1.2,5.294822311401367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,8,power_law_1.01,2.526131248474121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,8,balanced,3.1869548161824546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,8,power_law_1.01,4.111897659301758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,8,power_law_1.01,9.42007064819336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,8,balanced,3.971088091532389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,8,power_law_1.2,0.05320960283279419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,8,power_law_1.2,0.0630016028881073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,8,power_law_1.2,0.05748479962348938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,8,power_law_1.2,0.05720319747924805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,8,power_law_1.2,0.062745600938797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,8,power_law_1.2,0.06800000071525573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,8,power_law_1.2,0.07189120054244995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,8,power_law_1.2,0.07893120050430298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,8,power_law_1.2,0.08539519906044006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,8,power_law_1.2,0.08754559755325317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,8,power_law_1.2,0.08988800048828124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,8,power_law_1.2,0.09382399916648865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,8,balanced,6.244431813557942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,8,power_law_1.2,0.09701759815216064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,8,power_law_1.2,0.10512000322341919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,8,power_law_1.2,0.11546880006790161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,8,power_law_1.2,0.12021119594573974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,8,power_law_1.2,0.13569920063018798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,8,power_law_1.2,0.15926400423049927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,8,power_law_1.2,0.1710528016090393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,8,power_law_1.2,0.2280895948410034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,8,power_law_1.2,0.24609920978546143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,8,power_law_1.2,0.3209343910217285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,8,power_law_1.2,0.40405759811401365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,8,power_law_1.2,0.5363135814666748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,8,power_law_1.2,0.7250432014465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,8,power_law_1.2,1.0145600318908692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,8,power_law_1.2,1.3012800216674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,8,power_law_1.2,1.6158975601196288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,8,power_law_1.2,2.636787223815918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,8,power_law_1.2,5.337715148925781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,4,balanced,0.056234667698542275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,4,balanced,0.05765866736570994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,8,power_law_1.2,0.0638592004776001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,4,balanced,0.06001600126425425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,8,power_law_1.2,0.07189760208129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,4,balanced,0.0738613357146581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,8,power_law_1.2,0.07059839963912964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,4,balanced,0.09028266867001851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,8,power_law_1.2,0.06951680183410644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,4,balanced,0.12274133165677388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,4,balanced,0.04911466439565023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,8,power_law_1.2,0.07285119891166687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,4,balanced,0.14869333306948343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,4,balanced,0.05141866703828176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,8,power_law_1.2,0.07883520126342773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,4,balanced,0.14257599910100302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,8,power_law_1.2,0.08453119993209839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,4,balanced,0.05384533107280731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,4,balanced,0.14127467075983682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,8,power_law_1.2,0.09454079866409301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,4,balanced,0.14119999607404074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,4,balanced,0.0626986672480901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,8,power_law_1.2,0.09936000108718872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,4,balanced,0.14385066429773966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,4,balanced,0.07880533238252004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,8,power_law_1.2,0.09912319779396057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,4,balanced,0.14709333578745523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,4,balanced,0.10571199655532837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,8,power_law_1.2,0.1028607964515686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,4,balanced,0.13582932949066162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,4,balanced,0.14682132999102274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,8,power_law_1.2,0.10995199680328369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,4,balanced,0.1344373325506846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,4,balanced,0.14988266428311667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,8,power_law_1.2,0.11701760292053223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,4,balanced,0.13525333007176718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,4,balanced,0.15812266866366068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,8,power_law_1.2,0.1242751955986023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,4,balanced,0.1360586682955424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,8,power_law_1.2,0.13508479595184325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,4,balanced,0.16195199886957803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,8,power_law_1.2,0.14357119798660278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,4,balanced,0.13250666856765747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,4,balanced,0.16868799924850464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,8,power_law_1.2,0.16959359645843505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,4,balanced,0.14110933740933737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,8,power_law_1.2,0.2159872055053711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,4,balanced,0.18487467368443808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,4,balanced,0.14193600416183472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,4,balanced,0.14406933387120566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,4,balanced,0.20256000757217407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,8,power_law_1.2,0.23336319923400878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,4,balanced,0.1504533290863037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,4,balanced,0.23509333531061807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,4,balanced,0.15541866421699524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,4,balanced,0.1621386706829071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,4,balanced,0.2943999965985616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,8,power_law_1.2,0.2875391960144043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,4,balanced,0.18111467361450195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,8,power_law_1.2,0.3816256046295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,8,power_law_1.2,0.508070421218872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,4,balanced,0.3486613432566325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,4,balanced,0.20541866620381674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,8,power_law_1.2,0.6379263877868653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,8,power_law_1.2,0.9400832176208496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,4,balanced,0.24297600984573364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,4,balanced,0.425983985265096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,8,power_law_1.2,1.1744704246520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,4,power_law_1.01,0.05850239992141724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,4,balanced,0.29259733359018963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,8,power_law_1.2,1.8374975204467774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,4,power_law_1.01,0.07284479737281799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,8,power_law_1.2,2.579372787475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,4,power_law_1.01,0.05243520140647888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,4,balanced,0.36023465792338055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,4,power_law_1.01,0.0844543993473053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,4,balanced,0.571733315785726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,8,power_law_1.2,3.1042816162109377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,4,power_law_1.01,0.058847999572753905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,4,power_law_1.01,0.06795520186424256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,8,power_law_1.2,4.768179321289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,4,power_law_1.01,0.08646399974822998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,4,power_law_1.01,0.07260159850120544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,4,balanced,0.4442933400472005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,4,power_law_1.01,0.09941120147705078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,4,power_law_1.01,0.06349440217018128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,8,power_law_1.2,9.792569732666015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,4,power_law_1.01,0.10747519731521607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,4,power_law_1.01,0.07395200133323669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,4,balanced,0.7378453413645426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,4,power_law_1.01,0.11781120300292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,4,power_law_1.01,0.08533759713172913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,4,balanced,0.609221339225769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,4,power_law_1.01,0.1182528018951416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,4,power_law_1.01,0.08977919816970825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,4,power_law_1.01,0.12445440292358398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,4,power_law_1.01,0.10587519407272339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,4,power_law_1.01,0.1263808012008667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,4,power_law_1.01,0.10728319883346557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,4,power_law_1.01,0.13506560325622557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,4,power_law_1.01,0.11344640254974366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,4,balanced,1.037829319636027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,4,balanced,0.7933226426442465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,4,power_law_1.01,0.13779840469360352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,4,power_law_1.01,0.11544959545135498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,4,power_law_1.01,0.14082560539245606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,4,power_law_1.01,0.12154879570007324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,4,power_law_1.01,0.15264639854431153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,4,power_law_1.01,0.12414079904556274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,4,power_law_1.01,0.16049280166625976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,4,power_law_1.01,0.13173120021820067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,4,power_law_1.01,0.17616000175476074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,4,balanced,1.1310453414916992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,4,power_law_1.01,0.1440384030342102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,4,power_law_1.01,0.2132159948348999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,4,power_law_1.01,0.15423359870910644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,4,balanced,1.3466453552246094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,4,power_law_1.01,1.4453760147094727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,4,power_law_1.01,0.159443199634552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,4,power_law_1.01,1.4859392166137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,4,power_law_1.01,0.19842560291290284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,4,power_law_1.01,0.30392320156097413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,4,power_law_1.01,0.22330238819122314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,4,power_law_1.01,0.37988479137420655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,4,power_law_1.01,0.273855996131897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,4,power_law_1.01,0.459168004989624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,4,balanced,1.4731733004252117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,4,power_law_1.01,0.6430528163909912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,4,power_law_1.01,0.30449280738830564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,4,power_law_1.01,0.8294783592224121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,4,power_law_1.01,0.4025856018066406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,4,power_law_1.01,1.0963199615478516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,4,power_law_1.01,0.4864384174346924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,4,balanced,1.6557706197102864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,4,power_law_1.01,0.6708223819732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,4,power_law_1.01,1.4964351654052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,4,power_law_1.01,0.8455488204956054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,4,power_law_1.01,1.7670911788940429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,4,power_law_1.01,1.2893888473510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,4,power_law_1.01,2.8817983627319337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,4,power_law_1.01,1.5934783935546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,4,balanced,1.8252479235331218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,4,power_law_1.01,5.0693824768066404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,4,power_law_1.01,1.9802751541137695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,4,power_law_1.01,3.1821823120117188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,4,power_law_1.01,6.037241744995117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,4,balanced,2.514154593149821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,4,power_law_1.2,0.058329600095748904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,4,power_law_1.2,0.07278720140457154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,4,power_law_1.2,0.07125759720802308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,4,power_law_1.2,0.07205119729042053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,4,balanced,2.8201173146565757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,4,power_law_1.2,0.0838591992855072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,4,power_law_1.2,0.0976960003376007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,4,power_law_1.2,0.10377600193023681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,4,power_law_1.2,0.11325440406799317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,4,power_law_1.2,0.11912319660186768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,4,power_law_1.2,0.1238144040107727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,4,power_law_1.2,0.12254719734191895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,4,power_law_1.2,0.13509119749069215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,4,power_law_1.2,0.13749760389328003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,4,power_law_1.2,0.143014395236969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,4,power_law_1.2,0.1562175989151001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,4,power_law_1.2,0.16787199974060057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,4,power_law_1.2,0.17480319738388062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,4,power_law_1.2,0.21098880767822265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,4,power_law_1.2,1.4474752426147461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,4,power_law_1.2,1.495321559906006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,4,power_law_1.2,0.3159039974212646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,4,power_law_1.2,0.4031360149383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,4,balanced,4.647226651509603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,4,power_law_1.2,0.5026432037353515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,4,power_law_1.2,0.6891136169433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,4,power_law_1.2,0.8440959930419922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,4,power_law_1.2,1.2199616432189941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,4,balanced,5.425845464070638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,4,power_law_1.2,1.5899264335632324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,4,power_law_1.2,2.0220415115356447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,4,power_law_1.2,3.194278335571289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,4,power_law_1.2,6.3119873046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,4,power_law_1.2,0.051820802688598636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,4,power_law_1.2,0.058873599767684935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,4,power_law_1.2,0.05842559933662415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,4,power_law_1.2,0.06266239881515503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,4,power_law_1.2,0.07252479791641235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,4,power_law_1.2,0.08254719972610473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,4,power_law_1.2,0.08758400082588196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,4,power_law_1.2,0.10253440141677857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,4,power_law_1.2,0.10289280414581299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,4,power_law_1.2,0.11105279922485352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,4,power_law_1.2,0.11251840591430665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,4,power_law_1.2,0.11904640197753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,4,power_law_1.2,0.13191039562225343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,4,power_law_1.2,0.13540480136871338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,4,power_law_1.2,0.14739199876785278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,4,power_law_1.2,0.15507199764251708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,4,power_law_1.2,0.166048002243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,4,power_law_1.2,0.195961594581604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,4,power_law_1.2,0.23532159328460694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,4,power_law_1.2,0.28834559917449953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,128,balanced,0.051354666550954185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,4,power_law_1.2,0.3215167999267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,4,power_law_1.2,0.40165119171142577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,128,balanced,0.05291733145713806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,4,power_law_1.2,0.5267519950866699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,128,balanced,0.052789335449536644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,4,power_law_1.2,0.6975168228149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,128,balanced,0.059578667084376015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,4,power_law_1.2,0.9251584053039551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,128,balanced,0.06829333305358887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,4,power_law_1.2,1.3262399673461913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,128,power_law_1.01,0.0513152003288269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,128,balanced,0.08436266581217448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,128,power_law_1.2,0.05059199929237366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,128,balanced,0.07528000076611836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,128,power_law_1.01,0.05081599950790405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,4,power_law_1.2,1.7166976928710938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,128,balanced,0.07502399881680806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,128,power_law_1.01,0.05070080161094666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,4,power_law_1.2,2.0698688507080076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,128,power_law_1.2,0.05137280225753784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,128,balanced,0.08823999762535095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,128,power_law_1.01,0.055283200740814206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,4,power_law_1.2,3.554547119140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,128,power_law_1.2,0.050367999076843264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,128,balanced,0.08870933453241985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,128,power_law_1.01,0.06039680242538452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,128,power_law_1.2,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,128,balanced,0.08940800031026204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,4,power_law_1.2,6.553254699707031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,128,power_law_1.01,0.06881920099258423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,128,power_law_1.2,0.060038399696350095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,128,balanced,0.08688533306121826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,128,power_law_1.01,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,128,balanced,0.08577600121498108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,128,power_law_1.2,0.06837760210037232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,128,power_law_1.01,0.07087360024452209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,128,balanced,0.0867199997107188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,128,power_law_1.2,0.07057920098304749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,128,power_law_1.01,0.08399360179901123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,128,balanced,0.08699199557304382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,128,power_law_1.2,0.07070720195770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,128,power_law_1.01,0.08407679796218873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,128,balanced,0.08726933598518372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,128,power_law_1.2,0.08350719809532166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,128,balanced,0.08901866277058919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,128,power_law_1.01,0.08440960049629212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,128,power_law_1.2,0.08364160060882568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,128,power_law_1.01,0.08457599878311158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,128,balanced,0.09202133615811665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,128,power_law_1.2,0.08389120101928711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,128,power_law_1.01,0.08488320112228394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,128,balanced,0.095551997423172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,128,power_law_1.2,0.08414080142974853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,128,power_law_1.01,0.08573439717292786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,128,power_law_1.2,0.08449919819831848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,128,balanced,0.10258133212725322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,128,power_law_1.2,0.0855679988861084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,128,power_law_1.01,0.08628479838371277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,128,balanced,0.11147733529408772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,128,power_law_1.2,0.08627200126647949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,128,power_law_1.01,0.08710399866104127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,128,balanced,0.1291039983431498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,128,power_law_1.2,0.08681600093841553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,128,power_law_1.01,0.08955519795417785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,128,power_law_1.01,0.09594240188598632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,128,power_law_1.2,0.09038079977035522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,128,balanced,0.14572266737620035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,128,power_law_1.01,0.09804800152778625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,128,power_law_1.2,0.09508479833602905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,128,power_law_1.01,0.12750719785690307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,128,power_law_1.2,0.12014720439910889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,128,balanced,0.19288533926010132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,128,power_law_1.01,0.14937599897384643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,128,power_law_1.2,0.12936960458755492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,128,power_law_1.2,0.19674240350723265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,128,power_law_1.01,0.2111936092376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,128,balanced,0.22927467028299967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,128,power_law_1.2,0.2743232011795044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,128,power_law_1.01,0.2422976016998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,128,power_law_1.2,0.3214656114578247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,128,power_law_1.01,0.3346944093704224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,128,power_law_1.2,0.45290241241455076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,128,power_law_1.01,0.48226561546325686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,64,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,128,balanced,0.32607465982437134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,128,power_law_1.2,0.6629504203796387
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,128,power_law_1.01,0.6584512233734131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,64,balanced,0.04637866715590159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,128,power_law_1.2,0.9464768409729004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,128,power_law_1.01,0.8872832298278809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,64,balanced,0.046613335609436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,128,power_law_1.2,1.736569595336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,128,power_law_1.01,1.172985553741455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,64,balanced,0.047983999053637184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,128,power_law_1.2,1.8381887435913087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,128,balanced,0.4244426488876343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,128,power_law_1.01,2.1266752243041993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,64,balanced,0.05117866893609365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,128,power_law_1.2,3.4312065124511717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,64,balanced,0.05795200169086456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,128,power_law_1.01,3.770924758911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,64,balanced,0.06496533254782359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,128,power_law_1.2,5.90458869934082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,64,power_law_1.01,0.051923197507858274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,64,balanced,0.06516266862551372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,64,power_law_1.2,0.05182719826698303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,128,balanced,0.524832010269165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,64,power_law_1.01,0.04656000137329101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,64,balanced,0.07226666808128357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,64,power_law_1.2,0.04658559858798981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,64,power_law_1.01,0.04525440037250519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,64,balanced,0.0711946686108907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,64,power_law_1.2,0.04455040097236633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,64,power_law_1.01,0.04668799936771393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,64,balanced,0.07069333394368489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,64,power_law_1.2,0.046003198623657225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,64,power_law_1.01,0.05162879824638367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,64,balanced,0.06899199883143108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,64,power_law_1.2,0.050809597969055174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,64,balanced,0.07030933101971944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,64,power_law_1.01,0.05583360195159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,64,power_law_1.2,0.05730559825897217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,128,balanced,0.8251307010650635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,64,balanced,0.06955733398596446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,64,power_law_1.01,0.06050559878349304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,64,power_law_1.2,0.06182399988174438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,64,balanced,0.07111999889214833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,64,power_law_1.01,0.06253439784049988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,64,power_law_1.2,0.06053119897842407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,64,power_law_1.01,0.0674239993095398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,64,balanced,0.07042133311430614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,64,power_law_1.2,0.06721280217170715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,64,power_law_1.01,0.06765440106391907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,64,balanced,0.07235200206438701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,64,power_law_1.2,0.06732800006866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,64,power_law_1.01,0.06780800223350525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,64,power_law_1.2,0.06817280054092408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,64,balanced,0.07503999769687653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,64,power_law_1.01,0.06764159798622131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,64,power_law_1.2,0.06746240258216858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,64,balanced,0.07939200103282928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,64,power_law_1.01,0.06818559765815735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,64,power_law_1.2,0.06822400093078614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,64,balanced,0.08701866865158081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,64,power_law_1.01,0.0690559983253479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,64,power_law_1.2,0.06913920044898987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,64,balanced,0.09628267089525859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,64,power_law_1.01,0.0692799985408783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,64,power_law_1.2,0.07211520075798035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,64,power_law_1.01,0.06958079934120179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,64,power_law_1.2,0.07214720249176025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,64,balanced,0.11210133632024129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,64,power_law_1.01,0.07306240200996399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,64,power_law_1.2,0.07365120053291321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,128,balanced,1.6217279434204102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,64,power_law_1.01,0.07733759880065919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,64,balanced,0.12527466813723245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,64,power_law_1.2,0.08030719757080078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,64,power_law_1.01,0.0811456024646759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,64,power_law_1.2,0.0917952001094818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,64,balanced,0.17425066232681274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,64,power_law_1.01,0.08970239758491516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,64,power_law_1.2,0.12464640140533448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,64,power_law_1.01,0.11743359565734864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,64,power_law_1.2,0.1410048007965088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,32,balanced,0.033157333731651306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,64,balanced,0.21249600251515707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,64,power_law_1.01,0.16563839912414552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,64,power_law_1.2,0.1939903974533081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,32,balanced,0.034490667283535004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,64,power_law_1.2,0.25608320236206056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,64,power_law_1.01,0.2094208002090454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,32,balanced,0.03421333432197571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,32,balanced,0.036858665446440377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,64,power_law_1.01,0.2568576097488403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,64,power_law_1.2,0.3900288105010986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,64,balanced,0.30845866600672406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,32,balanced,0.04186133543650309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,64,power_law_1.01,0.37826559543609617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,64,power_law_1.2,0.43279361724853516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,32,balanced,0.046256000796953835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,64,power_law_1.01,0.5272128105163574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,64,power_law_1.2,0.7357888221740723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,32,balanced,0.04842133323351542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,64,power_law_1.01,0.7223296165466309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,64,power_law_1.2,0.9259584426879883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,32,balanced,0.05117333432038625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,64,balanced,0.398634672164917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,64,power_law_1.2,1.2598848342895508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,64,power_law_1.01,0.90250244140625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,32,balanced,0.06116800010204315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,32,power_law_1.01,0.03463039994239807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,64,power_law_1.2,2.0797183990478514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,64,power_law_1.01,1.3829504013061524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,32,balanced,0.06111466884613037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,32,power_law_1.01,0.03500159978866577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,64,power_law_1.2,4.221651077270508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,64,power_law_1.01,2.729644775390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,32,power_law_1.01,0.03464959859848023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,32,balanced,0.05789866546789805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,32,power_law_1.01,0.03900800049304962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,32,balanced,0.05782933533191681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,64,balanced,0.49318933486938477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,32,power_law_1.01,0.041606399416923526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,32,power_law_1.01,0.04509440064430237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,32,balanced,0.06172266602516174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,32,power_law_1.01,0.047244799137115476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,32,power_law_1.01,0.049753600358963014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,32,balanced,0.06124266485373179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,32,power_law_1.01,0.05924479961395264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,32,balanced,0.06163200239340464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,32,power_law_1.01,0.06197119951248169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,32,power_law_1.01,0.05601919889450073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,32,balanced,0.06159999966621399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,32,power_law_1.01,0.060115200281143186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,32,balanced,0.06311999758084615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,32,power_law_1.01,0.06090239882469177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,64,balanced,0.7709226608276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,32,power_law_1.01,0.06251519918441772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,32,balanced,0.06588799754778545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,32,power_law_1.01,0.06313599944114685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,32,power_law_1.01,0.06161919832229614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,32,balanced,0.06956799825032552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,32,power_law_1.01,0.06641280055046081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,32,balanced,0.07696000238259633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,32,power_law_1.01,0.07022079825401306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,32,balanced,0.08822932839393616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,32,power_law_1.01,0.08350719809532166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,32,balanced,0.10702932874361674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,32,power_law_1.01,0.09266560077667237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,32,power_law_1.01,0.10102399587631225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,32,power_law_1.01,0.14807039499282837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,32,balanced,0.12304000059763591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,32,power_law_1.01,0.17002880573272705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,32,power_law_1.01,0.2348479986190796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,32,balanced,0.16940800348917642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,32,power_law_1.01,0.30436480045318604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,32,power_law_1.01,0.44768638610839845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,32,power_law_1.01,0.5623616218566895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,32,balanced,0.20533865690231323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,32,power_law_1.01,0.6829760074615479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,64,balanced,1.522607962290446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,32,power_law_1.01,1.065548801422119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,32,power_law_1.01,2.2365055084228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,32,balanced,0.29843733708063763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,16,balanced,0.029274667302767437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,32,balanced,0.38342400391896564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,32,power_law_1.2,0.03443840146064758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,16,balanced,0.032501332461833954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,32,power_law_1.2,0.034841600060462954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,16,balanced,0.03271466741959254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,32,power_law_1.2,0.033555200695991515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,16,balanced,0.03389866650104523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,16,balanced,0.03559466699759165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,32,power_law_1.2,0.03758080005645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,32,balanced,0.4719626506169637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,16,balanced,0.03755199909210205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,32,power_law_1.2,0.04090240001678467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,16,balanced,0.0410453329483668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,32,power_law_1.2,0.045132800936698914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,16,balanced,0.04074666649103165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,32,power_law_1.2,0.04787839949131012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,16,balanced,0.04507733384768168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,32,power_law_1.2,0.05013759732246399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,32,power_law_1.2,0.05966079831123352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,16,balanced,0.04524266719818115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,32,power_law_1.2,0.06428800225257873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,16,balanced,0.04458666841189066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,32,balanced,0.7418719927469889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,32,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,16,balanced,0.05996266504128774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,32,power_law_1.2,0.0564736008644104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,16,balanced,0.06281066437562306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,32,power_law_1.2,0.06250240206718445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,16,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,32,power_law_1.2,0.06339840292930603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,16,balanced,0.05776533484458923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,32,power_law_1.2,0.06484479904174804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,16,balanced,0.06371733546257019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,32,power_law_1.2,0.0642304003238678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,16,balanced,0.06525866687297821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,32,power_law_1.2,0.06755200028419495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,16,balanced,0.06905599931875865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,16,power_law_1.01,0.030169600248336793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,32,power_law_1.2,0.07562879920005798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,16,balanced,0.07314133147398631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,32,power_law_1.2,0.08777599930763244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,16,power_law_1.01,0.03374719917774201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,16,balanced,0.08179733157157898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,32,power_law_1.2,0.09567999839782715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,16,power_law_1.01,0.03288959860801697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,32,power_law_1.2,0.11931519508361817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,16,power_law_1.01,0.034560000896453856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,16,balanced,0.09131200114885966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,16,power_law_1.01,0.03568640053272247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,32,power_law_1.2,0.16457600593566896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,32,balanced,1.455674648284912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,16,balanced,0.11020267009735107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,16,power_law_1.01,0.03694719970226288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,32,power_law_1.2,0.18422399759292601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,16,power_law_1.01,0.04048640131950378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,32,power_law_1.2,0.2730112075805664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,16,balanced,0.12622933586438498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,16,power_law_1.01,0.03909119963645935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,32,power_law_1.2,0.3669183969497681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,16,power_law_1.01,0.044659200310707095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,32,power_law_1.2,0.4961728096008301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,16,balanced,0.17259732882181802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,16,power_law_1.01,0.04506239891052246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,32,power_law_1.2,0.7526463985443115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,16,power_law_1.01,0.04300160109996796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,32,power_law_1.2,0.7962624073028565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,16,balanced,0.2059733271598816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,16,power_law_1.01,0.06097279787063599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,32,power_law_1.2,1.5080320358276367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,16,power_law_1.2,0.030073601007461547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,16,power_law_1.01,0.060678398609161376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,32,power_law_1.2,3.00634880065918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,16,balanced,0.30532266696294147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,16,power_law_1.2,0.03341439962387085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,16,power_law_1.01,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,8,balanced,0.028437333802382152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,16,power_law_1.2,0.031590399146080014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,16,power_law_1.01,0.05818880200386047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,8,balanced,0.02861333390076955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,16,power_law_1.2,0.034764799475669864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,16,power_law_1.01,0.0651968002319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,8,balanced,0.033701332906881966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,16,power_law_1.2,0.035366401076316833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,16,power_law_1.01,0.06711040139198303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,8,balanced,0.0352906659245491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,16,balanced,0.3821226755777995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,16,power_law_1.2,0.03644160032272339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,16,power_law_1.01,0.07294719815254211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,8,balanced,0.0377866675456365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,16,power_law_1.2,0.040633600950241086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,16,power_law_1.01,0.07771520018577575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,8,balanced,0.0383146678407987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,16,power_law_1.2,0.03937920033931732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,8,balanced,0.03810133288304011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,16,power_law_1.01,0.08837119936943054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,16,power_law_1.2,0.04450559914112091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,8,balanced,0.04090133309364319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,16,power_law_1.01,0.10218240022659301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,16,power_law_1.2,0.045433598756790164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,16,balanced,0.4715199867884318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,8,balanced,0.03985599925120672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,16,power_law_1.01,0.12361600399017333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,16,power_law_1.2,0.044275200366973876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,8,balanced,0.04041066765785217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,16,power_law_1.01,0.16212480068206786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,16,power_law_1.2,0.06223359704017639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,8,balanced,0.0489333321650823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,16,power_law_1.01,0.2254080057144165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,16,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,8,balanced,0.04721599817276001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,16,power_law_1.2,0.05973119735717773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,16,power_law_1.01,0.27859840393066404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,8,balanced,0.047279998660087585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,16,power_law_1.2,0.0598143994808197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,16,power_law_1.01,0.3930367946624756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,8,balanced,0.06753066678841908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,16,power_law_1.2,0.06625919938087463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,16,power_law_1.01,0.4915520191192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,8,balanced,0.0624533345301946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,16,balanced,0.7353546619415283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,16,power_law_1.2,0.06850559711456299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,16,power_law_1.01,0.6338624000549317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,8,balanced,0.06490666667620341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,16,power_law_1.2,0.07643520236015319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,16,power_law_1.01,1.0994048118591309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,8,balanced,0.07606400052706401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,16,power_law_1.2,0.07946239709854126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,8,power_law_1.01,0.027833598852157592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,16,power_law_1.01,1.97523193359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,8,balanced,0.08072533210118611
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,16,power_law_1.2,0.09452800154685974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,8,power_law_1.2,0.027539199590682982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,16,power_law_1.2,0.10311679840087891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,8,power_law_1.01,0.03152639865875244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,8,balanced,0.09007466832796733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,8,power_law_1.2,0.031052801012992858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,16,power_law_1.2,0.13752319812774658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,8,power_law_1.01,0.029120001196861266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,8,power_law_1.2,0.029164800047874452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,8,balanced,0.0997279981772105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,16,power_law_1.2,0.17868160009384154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,8,power_law_1.01,0.03240320086479187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,8,power_law_1.2,0.03280639946460724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,8,balanced,0.11742933591206868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,16,power_law_1.2,0.26755199432373045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,8,power_law_1.01,0.034944000840187076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,8,power_law_1.2,0.03364480137825012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,16,power_law_1.2,0.30674560070037843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,8,balanced,0.1343893309434255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,8,power_law_1.01,0.03583360016345978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,8,power_law_1.2,0.036185601353645326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,16,power_law_1.2,0.43640961647033694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,8,power_law_1.01,0.0381056010723114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,8,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,16,power_law_1.2,0.5712639808654785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,8,balanced,0.1884053349494934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,8,power_law_1.01,0.03874559998512268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,8,power_law_1.2,0.03776000142097473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,16,power_law_1.2,0.6923007965087891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,16,balanced,1.4415839513142903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,8,power_law_1.01,0.04154239892959595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,8,power_law_1.2,0.04131200015544891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,16,power_law_1.2,1.3558208465576171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,8,balanced,0.22402666012446085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,8,power_law_1.01,0.04037120044231415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,8,power_law_1.2,0.039705601334571836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,16,power_law_1.2,2.337356758117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,8,power_law_1.01,0.04100480079650879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,8,power_law_1.2,0.04110719859600067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,8,power_law_1.01,0.04878720045089722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,8,power_law_1.2,0.04880639910697937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,8,balanced,0.3279946645100911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,8,power_law_1.01,0.04572800099849701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,8,power_law_1.2,0.04661760032176972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,8,power_law_1.01,0.04695039987564087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,8,power_law_1.2,0.0493120014667511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,8,power_law_1.01,0.06856319904327393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,8,power_law_1.2,0.0707647979259491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,8,balanced,0.4188053210576375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,8,power_law_1.01,0.06317440271377564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,8,power_law_1.2,0.06726400256156921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,8,power_law_1.01,0.06558719873428345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,8,power_law_1.2,0.07075200080871583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,8,power_law_1.01,0.07834879755973816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,8,power_law_1.2,0.08186879754066467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,8,power_law_1.01,0.0865664005279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,8,power_law_1.2,0.08731520175933838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,8,power_law_1.01,0.09857280254364013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,8,balanced,0.5207519928614298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,8,power_law_1.2,0.09813759922981262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,8,power_law_1.01,0.10542720556259155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,8,power_law_1.2,0.12082560062408447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,8,power_law_1.01,0.13199360370635987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,8,power_law_1.2,0.15329279899597167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,8,power_law_1.01,0.18154879808425903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,8,power_law_1.2,0.18652160167694093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,8,power_law_1.01,0.23654398918151856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,8,power_law_1.01,0.28709120750427247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,8,power_law_1.2,0.26086399555206297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,8,power_law_1.01,0.4190080165863037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,8,power_law_1.2,0.3231168031692505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,8,balanced,0.8067359924316406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,8,power_law_1.01,0.558022403717041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,4,balanced,0.02643200010061264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,8,power_law_1.2,0.42936320304870607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,8,power_law_1.01,0.626803207397461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,4,balanced,0.028192001084486645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,8,power_law_1.2,0.5979968070983886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,8,power_law_1.01,1.0111616134643555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,4,balanced,0.028736000259717304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,4,balanced,0.0323786661028862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,8,power_law_1.2,0.7284224033355713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,8,power_law_1.01,1.9825599670410157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,4,balanced,0.035029334326585136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,4,balanced,0.04014399896065394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,8,power_law_1.2,1.2860032081604005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,4,balanced,0.04033066580692927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,4,balanced,0.03897066662708918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,4,balanced,0.04004266609748205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,8,power_law_1.2,2.3833663940429686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,4,balanced,0.039919999738534294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,4,power_law_1.01,0.026707199215888978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,4,balanced,0.040607998768488564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,4,balanced,0.043712000052134194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,4,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,4,balanced,0.04343999922275543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,4,power_law_1.01,0.028288000822067262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,4,balanced,0.04378133515516917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,4,balanced,0.051402668158213295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,4,power_law_1.01,0.030873599648475646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,8,balanced,1.579744021097819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,4,balanced,0.051685333251953125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,4,power_law_1.01,0.03384959995746613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,4,balanced,0.054272000988324486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,4,power_law_1.01,0.034841600060462954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,4,balanced,0.07957333326339722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,4,balanced,0.08540266752243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,4,power_law_1.01,0.03863680064678192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,4,balanced,0.09904533624649048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,4,power_law_1.01,0.03682560026645661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,4,power_law_1.01,0.03861759901046753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,4,balanced,0.10875200231870015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,4,power_law_1.01,0.03929600119590759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,4,balanced,0.1271519958972931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,4,power_law_1.01,0.04042240083217621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,4,power_law_1.01,0.043263998627662656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,4,balanced,0.14516799648602804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,4,power_law_1.01,0.04215039908885956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,4,power_law_1.01,0.043296000361442565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,4,power_law_1.01,0.05121279954910278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,4,balanced,0.20569600661595663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,4,power_law_1.01,0.05101439952850342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,4,power_law_1.01,0.053286397457122804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,4,power_law_1.01,0.08107519745826722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,4,balanced,0.2423306703567505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,4,power_law_1.01,0.08863999843597412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,4,power_law_1.01,0.1061568021774292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,4,power_law_1.01,0.11745920181274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,4,power_law_1.01,0.14321919679641723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,4,balanced,0.35599998633066815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,4,power_law_1.2,0.026892799139022826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,4,power_law_1.01,0.17433600425720214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,4,power_law_1.2,0.028364801406860353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,4,power_law_1.01,0.240447998046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,4,power_law_1.01,0.29872000217437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,4,power_law_1.2,0.02794879972934723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,4,power_law_1.01,0.4540031909942627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,4,balanced,0.45291733741760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,4,power_law_1.2,0.03084160089492798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,4,power_law_1.01,0.546566390991211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,4,power_law_1.2,0.033913600444793704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,4,power_law_1.01,0.6959936141967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,4,power_law_1.2,0.03472639918327332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,4,power_law_1.01,1.0457663536071777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,4,power_law_1.2,0.03871360123157501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,4,power_law_1.01,1.9969152450561523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,4,power_law_1.2,0.03765760064125061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,4,balanced,0.5673706531524658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,4,power_law_1.2,0.03800320029258728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,4,power_law_1.2,0.03933440148830414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,4,power_law_1.2,0.04051840007305145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,4,power_law_1.2,0.043680000305175784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,4,power_law_1.2,0.04245119988918304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,4,power_law_1.2,0.0455808013677597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,32,balanced,0.030778666337331135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,32,power_law_1.01,0.030348798632621764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,4,power_law_1.2,0.05236480236053467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,4,balanced,0.8750399748484293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,32,balanced,0.032298666735490165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,32,power_law_1.01,0.031046399474143983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,4,power_law_1.2,0.05338240265846252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,4,power_law_1.2,0.057920002937316896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,32,balanced,0.032042667269706726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,32,power_law_1.01,0.030905601382255555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,4,power_law_1.2,0.0942911982536316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,4,power_law_1.2,0.09110400080680847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,32,balanced,0.036330667634805046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,32,power_law_1.01,0.034092798829078674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,4,power_law_1.2,0.1098688006401062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,4,power_law_1.2,0.11905280351638795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,4,power_law_1.2,0.15871360301971435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,32,power_law_1.01,0.037376001477241516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,32,balanced,0.03955200066169103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,4,power_law_1.2,0.18173439502716066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,4,power_law_1.2,0.25571839809417723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,4,power_law_1.2,0.33108479976654054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,32,balanced,0.04706133405367533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,32,power_law_1.01,0.046105599403381346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,4,power_law_1.2,0.49057278633117674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,4,balanced,1.7073599497477214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,4,power_law_1.2,0.5874815940856933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,4,power_law_1.2,0.7287360191345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,32,balanced,0.04690133531888326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,32,power_law_1.01,0.04604159891605377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,4,power_law_1.2,1.112492847442627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,32,balanced,0.04729066789150238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,32,power_law_1.01,0.046348801255226134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,4,power_law_1.2,2.4656768798828126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,32,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,32,balanced,0.048245335618654885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,32,power_law_1.2,0.03107840120792389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,32,power_law_1.01,0.047839999198913574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,32,balanced,0.04832000037034353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,32,power_law_1.01,0.04767360091209412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,32,power_law_1.2,0.031033599376678468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,32,balanced,0.0509493350982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,32,power_law_1.01,0.05055360198020935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,32,power_law_1.2,0.03412480056285858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,32,balanced,0.050698667764663696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,32,power_law_1.2,0.03711360096931458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,32,power_law_1.01,0.05101439952850342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,16,balanced,0.02770666778087616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,32,balanced,0.05829333265622457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,32,power_law_1.2,0.046540799736976626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,32,power_law_1.01,0.057171201705932616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,16,balanced,0.028927999238173168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,32,balanced,0.05817066629727682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,32,power_law_1.2,0.04661119878292084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,32,power_law_1.01,0.05797759890556335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,16,balanced,0.028650666276613872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,32,balanced,0.05880000193913778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,32,power_law_1.2,0.046412798762321475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,32,power_law_1.01,0.0588096022605896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,16,balanced,0.03276266654332479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,32,balanced,0.05885333319505056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,32,power_law_1.2,0.04805760085582733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,16,balanced,0.03392533212900162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,32,power_law_1.01,0.05914239883422852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,32,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,32,power_law_1.2,0.04782080054283142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,16,balanced,0.03585066646337509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,32,power_law_1.2,0.05062400102615357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,32,power_law_1.01,0.060172802209854125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,32,balanced,0.06238399942715963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,16,power_law_1.01,0.028537601232528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,16,balanced,0.041840001940727234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,32,power_law_1.2,0.051551997661590576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,32,power_law_1.01,0.06472319960594178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,32,balanced,0.06584533552328746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,16,balanced,0.041450666884581246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,16,power_law_1.01,0.028217598795890808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,32,power_law_1.2,0.05783039927482605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,32,power_law_1.01,0.0766975998878479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,32,balanced,0.07282666862010956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,16,power_law_1.01,0.0286080002784729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,16,balanced,0.041706666350364685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,32,power_law_1.2,0.05829120278358459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,32,power_law_1.01,0.10180480480194092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,16,balanced,0.04203199843565623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,16,power_law_1.01,0.031462401151657104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,32,balanced,0.08120533327261607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,32,power_law_1.2,0.05961599946022034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,32,power_law_1.01,0.12117760181427002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,16,balanced,0.04251199960708618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,16,power_law_1.01,0.03312000036239624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,32,power_law_1.2,0.05920000076293945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,32,power_law_1.01,0.1691200017929077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,32,balanced,0.1011946698029836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,16,power_law_1.01,0.03555200099945068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,32,power_law_1.2,0.06076800227165222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,32,power_law_1.01,0.21247360706329346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,16,power_law_1.01,0.040934398770332336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,32,power_law_1.2,0.07206400036811829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,32,balanced,0.11817600329717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,16,power_law_1.01,0.04165120124816894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,32,power_law_1.01,0.3162175893783569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,32,power_law_1.2,0.07939199805259704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,16,balanced,0.042821332812309265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,16,power_law_1.01,0.04173440039157868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,32,power_law_1.01,0.4013055801391602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,32,power_law_1.2,0.11082240343093872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,32,balanced,0.15793599685033163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,16,balanced,0.044826666514078774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,16,power_law_1.01,0.04166400134563446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,32,power_law_1.2,0.13343360424041747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,32,power_law_1.01,0.6130815982818604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,16,balanced,0.04746133089065552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,16,power_law_1.01,0.041945600509643556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,32,power_law_1.2,0.19165439605712892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,32,power_law_1.01,0.783622407913208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,32,balanced,0.19788267215092978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,16,balanced,0.04790933430194855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,16,power_law_1.01,0.0426367998123169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,32,power_law_1.2,0.22860798835754395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,32,power_law_1.01,0.9668671607971191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,16,balanced,0.05524266759554545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,16,power_law_1.01,0.044275200366973876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,32,power_law_1.2,0.3340543985366821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,32,power_law_1.01,1.5233920097351075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,16,power_law_1.01,0.04767360091209412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,16,balanced,0.05673066775004069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,32,power_law_1.2,0.43508481979370117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,32,balanced,0.2894879976908366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,32,power_law_1.01,3.195027160644531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,16,power_law_1.01,0.04895359873771667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,16,balanced,0.05835733314355215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,32,power_law_1.2,0.6391295909881591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,16,power_law_1.01,0.0547327995300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,16,balanced,0.0621066689491272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,32,power_law_1.2,0.8458368301391601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,16,power_law_1.01,0.05729920268058777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,32,power_law_1.2,1.0504639625549317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,16,balanced,0.07106666763623555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,16,power_law_1.01,0.0659712016582489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,32,balanced,0.37271467844645184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,32,power_law_1.2,1.6656255722045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,16,balanced,0.0824533353249232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,16,power_law_1.01,0.070796799659729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,16,power_law_1.2,0.028441599011421202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,32,power_law_1.2,3.301715087890625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,16,power_law_1.01,0.08251519799232483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,16,balanced,0.10352533062299092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,16,power_law_1.2,0.028288000822067262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,16,power_law_1.01,0.09912959933280945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,16,power_law_1.2,0.0286655992269516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,16,power_law_1.01,0.14623359441757203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,16,balanced,0.12219199538230896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,16,power_law_1.2,0.03113600015640259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,32,balanced,0.4598720073699951
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,16,power_law_1.01,0.18569600582122803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,16,power_law_1.2,0.03312000036239624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,16,power_law_1.01,0.29246718883514405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,16,balanced,0.1623306671778361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,16,power_law_1.2,0.035699200630187986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,16,power_law_1.01,0.32394239902496336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,16,power_law_1.2,0.04100480079650879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,16,power_law_1.01,0.49831042289733884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,16,balanced,0.20006400346755981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,16,power_law_1.2,0.041331198811531064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,16,power_law_1.01,0.718675184249878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,16,power_law_1.2,0.04234879910945892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,16,power_law_1.01,0.8439488410949707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,16,power_law_1.2,0.04170880019664765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,32,balanced,0.7204106648763021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,16,balanced,0.29630400737126666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,16,power_law_1.01,1.4493887901306153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,16,power_law_1.2,0.04206080138683319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,16,power_law_1.2,0.04294399917125702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,16,power_law_1.01,2.5369279861450194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,16,power_law_1.2,0.04471679925918579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,16,power_law_1.2,0.047686401009559634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,16,balanced,0.37195734182993573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,16,power_law_1.2,0.04896000027656555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,16,power_law_1.2,0.055276799201965335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,16,power_law_1.2,0.05688959956169128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,16,power_law_1.2,0.06897280216217042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,16,power_law_1.2,0.07315840125083924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,16,balanced,0.46010132630666095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,16,power_law_1.2,0.09003520011901855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,8,balanced,0.025983999172846477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,16,power_law_1.2,0.11611520051956177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,8,balanced,0.027221334477265675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,16,power_law_1.2,0.1803264021873474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,32,balanced,1.4235893885294597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,8,balanced,0.027855999767780304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,16,power_law_1.2,0.2164223909378052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,8,balanced,0.03178666780392329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,16,power_law_1.2,0.31651840209960935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,8,balanced,0.031925333042939506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,16,power_law_1.2,0.4050111770629883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,16,balanced,0.7218506336212158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,8,balanced,0.0332640012105306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,16,power_law_1.2,0.6603456020355225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,8,balanced,0.035717333356539406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,16,power_law_1.2,0.7993152141571045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,8,power_law_1.01,0.02650879919528961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,8,balanced,0.035818666219711304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,16,power_law_1.2,1.0599679946899414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,8,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,8,balanced,0.039701332648595176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,16,power_law_1.2,1.4421631813049316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,8,power_law_1.01,0.027750399708747864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,8,balanced,0.03994666785001755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,8,power_law_1.01,0.029734399914741517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,16,power_law_1.2,3.3079742431640624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,8,balanced,0.04070399949947993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,8,power_law_1.01,0.031276801228523256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,8,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,8,power_law_1.01,0.03278720080852508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,8,balanced,0.04148799926042557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,8,power_law_1.01,0.034764799475669864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,8,balanced,0.041989331444104515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,8,power_law_1.01,0.0351936012506485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,8,balanced,0.043712000052134194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,8,power_law_1.01,0.040115201473236085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,8,balanced,0.04762133459250132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,16,balanced,1.4138879776000977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,8,power_law_1.01,0.04038400053977966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,8,balanced,0.04958933095137278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,8,power_law_1.01,0.04005120098590851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,8,balanced,0.05835199852784475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,8,power_law_1.01,0.04069119989871979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,8,balanced,0.06158933540185293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,8,power_law_1.01,0.04126079976558685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,8,balanced,0.07657599945863088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,8,power_law_1.01,0.04314880073070526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,8,balanced,0.08595200379689534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,8,power_law_1.01,0.04655359983444214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,8,balanced,0.10891200105349223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,8,power_law_1.01,0.052748799324035645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,8,power_law_1.01,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,8,balanced,0.1288746694723765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,8,power_law_1.01,0.06945279836654664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,8,power_law_1.01,0.07223039865493774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,8,balanced,0.1725813349088033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,8,power_law_1.01,0.08516479730606079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,8,power_law_1.01,0.10154240131378174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,8,balanced,0.21678932507832846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,8,power_law_1.01,0.14446719884872436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,8,power_law_1.01,0.1841215968132019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,8,power_law_1.2,0.026572799682617186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,8,power_law_1.01,0.25175039768218993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,8,balanced,0.3190559943517049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,8,power_law_1.2,0.026995199918746948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,8,power_law_1.01,0.34561920166015625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,8,power_law_1.2,0.026976001262664796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,8,power_law_1.01,0.4719871997833252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,8,power_law_1.2,0.02993279993534088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,8,power_law_1.01,0.5901631832122802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,8,power_law_1.2,0.03121280074119568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,8,balanced,0.4073813358942668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,8,power_law_1.2,0.03280639946460724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,8,power_law_1.01,0.7627007961273193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,4,balanced,0.02508266766866048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,8,power_law_1.2,0.034720000624656674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,8,power_law_1.01,1.154099178314209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,4,balanced,0.027077332139015198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,8,power_law_1.2,0.0353408008813858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,8,power_law_1.01,2.2522048950195312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,4,balanced,0.027503999571005504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,8,power_law_1.2,0.04095360040664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,4,balanced,0.03124266614516576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,8,balanced,0.5063733259836832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,8,power_law_1.2,0.040627199411392215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,4,balanced,0.031354665756225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,8,power_law_1.2,0.04059520065784454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,4,balanced,0.03166399896144867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,8,power_law_1.2,0.041580799221992495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,4,balanced,0.03321066747109095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,8,power_law_1.2,0.0423552006483078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,4,balanced,0.03262399882078171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,8,power_law_1.2,0.04386560022830963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,4,balanced,0.03480533262093862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,8,power_law_1.2,0.048793599009513855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,4,balanced,0.034901333351929985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,8,power_law_1.2,0.052934402227401735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,8,balanced,0.7889813582102457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,4,balanced,0.035562666753927864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,8,power_law_1.2,0.05568640232086182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,4,balanced,0.04186666508515676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,8,power_law_1.2,0.07040640115737914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,4,balanced,0.0428959975639979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,8,power_law_1.2,0.07671679854393006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,4,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,4,power_law_1.01,0.026137599349021913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,8,power_law_1.2,0.08856319785118102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,4,balanced,0.04340800146261851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,8,power_law_1.2,0.11108479499816895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,4,power_law_1.01,0.02632960081100464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,4,balanced,0.044639999667803444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,8,power_law_1.2,0.15737600326538087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,4,power_law_1.01,0.026752001047134398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,4,balanced,0.04757333298524221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,8,power_law_1.2,0.18078720569610596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,4,power_law_1.01,0.029760000109672547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,4,balanced,0.05541333556175232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,8,power_law_1.2,0.2824320077896118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,4,power_law_1.01,0.03075839877128601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,4,balanced,0.05986666679382324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,8,power_law_1.2,0.3867583990097046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,4,power_law_1.01,0.03147520124912262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,4,power_law_1.2,0.025900799036026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,4,balanced,0.08083199958006541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,8,power_law_1.2,0.5221951961517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,4,power_law_1.01,0.03243519961833954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,4,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,8,power_law_1.2,0.738316822052002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,4,balanced,0.09139733513196309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,4,power_law_1.2,0.026547199487686156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,4,power_law_1.01,0.03226880133152008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,8,balanced,1.550458590189616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,4,power_law_1.2,0.02910720109939575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,4,power_law_1.01,0.03498240113258362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,8,power_law_1.2,0.9888192176818847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,4,power_law_1.2,0.030668801069259642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,4,balanced,0.11543466647466023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,4,power_law_1.2,0.03115519881248474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,4,power_law_1.01,0.03484799861907959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,8,power_law_1.2,1.5135104179382324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,4,power_law_1.2,0.03195520043373108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,4,balanced,0.13750400145848593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,4,power_law_1.01,0.036556801199913024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,4,power_law_1.2,0.03269760012626648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,8,power_law_1.2,3.0640703201293946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,4,power_law_1.2,0.03468799889087677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,4,power_law_1.01,0.04280959963798523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,4,power_law_1.2,0.0353983998298645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,4,balanced,0.18637865781784058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,4,power_law_1.2,0.03573119938373566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,4,power_law_1.01,0.04382080137729645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,4,power_law_1.2,0.04284160137176514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,4,power_law_1.01,0.0442111998796463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,4,power_law_1.2,0.04360319972038269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,4,balanced,0.23305066426595053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,4,power_law_1.01,0.04620159864425659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,4,power_law_1.2,0.0451200008392334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,4,power_law_1.2,0.04643200039863586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,4,power_law_1.01,0.04732159972190857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,4,power_law_1.2,0.04855040013790131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,8,balanced,0.029631999631722767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,4,power_law_1.01,0.05187839865684509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,4,power_law_1.2,0.052928000688552856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,8,balanced,0.02945599953333537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,4,power_law_1.2,0.0641215980052948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,4,balanced,0.34443732102711994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,4,power_law_1.01,0.0630400002002716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,8,balanced,0.029493334392706554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,4,power_law_1.2,0.0720255970954895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,4,power_law_1.01,0.06997119784355163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,4,power_law_1.2,0.08711040019989014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,8,balanced,0.030458666384220123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,4,power_law_1.2,0.1053056001663208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,4,power_law_1.01,0.08997759819030762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,8,balanced,0.031471999982992806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,8,balanced,0.03047466774781545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,4,power_law_1.2,0.13846399784088134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,4,power_law_1.01,0.1058303952217102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,8,balanced,0.03141866624355316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,4,balanced,0.437610665957133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,8,balanced,0.03068266560633977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,4,power_law_1.2,0.18138240575790404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,4,power_law_1.01,0.14041600227355958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,4,power_law_1.2,0.27601280212402346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,8,balanced,0.03169066707293192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,8,balanced,0.03128000100453695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,4,power_law_1.2,0.34497919082641604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,4,power_law_1.01,0.160697603225708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,8,balanced,0.0327360009153684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,8,balanced,0.03585066646337509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,4,power_law_1.2,0.5208127975463868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,4,power_law_1.01,0.2481600046157837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,8,balanced,0.033573334415753685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,8,balanced,0.035887998839219414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,4,power_law_1.2,0.7062592029571533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,4,power_law_1.01,0.30032639503479003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,8,balanced,0.03606399893760681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,4,power_law_1.2,0.9764224052429199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,8,balanced,0.033514666060606636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,4,balanced,0.5497973362604777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,4,power_law_1.01,0.47034878730773927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,4,power_law_1.2,1.3355392456054687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,8,balanced,0.03551466763019562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,8,balanced,0.0335413341720899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,8,balanced,0.03679466744263967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,4,power_law_1.01,0.5469056129455566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,4,power_law_1.2,2.682969665527344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,8,balanced,0.034245334565639496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,8,balanced,0.03734400123357773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,8,balanced,0.03429333368937174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,4,power_law_1.01,0.7494080066680908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,8,balanced,0.03547733277082443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,8,balanced,0.03979733337958654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,4,power_law_1.01,1.0844799995422363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,8,balanced,0.03504000107447306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,8,balanced,0.04270400106906891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,4,power_law_1.01,2.330803108215332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,8,balanced,0.035242666800816856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,8,balanced,0.043418665726979576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,8,balanced,0.03602666656176249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,4,balanced,0.8517119884490967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,8,balanced,0.04248000184694926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,8,balanced,0.036506667733192444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,8,balanced,0.04422933359940847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,8,balanced,0.040522667268911995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,8,balanced,0.0443146675825119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,8,balanced,0.0400693342089653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,8,balanced,0.06065066655476888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,8,balanced,0.04164800047874451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,8,balanced,0.052832002441088356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,8,balanced,0.04588800172011057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,8,balanced,0.07301866511503856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,8,balanced,0.04734399914741516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,8,balanced,0.05925333499908447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,8,balanced,0.06805333495140076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,8,balanced,0.06592000027497609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,8,balanced,0.10060266653696696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,8,balanced,0.09133332967758179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,8,balanced,0.10122133294741313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,8,balanced,0.10008533795674641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,4,balanced,1.6718826293945312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,8,balanced,0.1390773355960846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,8,balanced,0.14732266465822855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,8,balanced,0.024869332710901897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,8,balanced,0.16104533274968466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,8,balanced,0.024832000335057575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,8,balanced,0.17249067624409994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,8,balanced,0.024842667082945507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,8,balanced,0.22823466857274374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,8,balanced,0.02619733413060506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,8,balanced,0.027242665489514668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,8,balanced,0.2351093292236328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,8,balanced,0.027445333699385326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,8,balanced,0.2850026686986287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,8,balanced,0.027653334041436512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,8,balanced,0.02740799884001414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,8,balanced,0.02752533306678136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,8,balanced,0.3606293201446533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,8,balanced,0.31062932809193927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,8,balanced,0.027962667246659596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,8,balanced,0.02809600035349528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,8,balanced,0.5287839968999227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,8,balanced,0.028933333853880566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,8,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,8,power_law_1.01,0.02876160144805908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,8,balanced,0.028362666567166645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,8,balanced,0.5711413224538168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,8,power_law_1.01,0.028729599714279175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,8,power_law_1.01,0.028575998544692994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,8,power_law_1.01,0.029785600304603577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,8,power_law_1.01,0.029747200012207032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,8,balanced,0.03473066786924998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,8,balanced,1.0249333381652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,8,power_law_1.01,0.03950720131397247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,8,balanced,0.03478399912516276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,8,power_law_1.01,0.042156800627708435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,8,balanced,0.03475199888149897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,8,power_law_1.01,0.031206399202346802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,8,power_law_1.01,0.03560959994792938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,8,power_law_1.01,0.03136000037193298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,8,power_law_1.01,0.036211198568344115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,8,balanced,0.03939733405907949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,8,power_law_1.01,0.03139199912548065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,8,power_law_1.01,0.03689599931240082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,8,balanced,0.04091733445723852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,8,power_law_1.01,0.03273600041866302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,8,power_law_1.01,0.0377344012260437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,8,power_law_1.01,0.03325439989566803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,8,power_law_1.01,0.038252800703048706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,8,power_law_1.01,0.034067198634147644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,8,power_law_1.01,0.03802880048751831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,8,power_law_1.01,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,8,power_law_1.01,0.04451839923858643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,8,balanced,0.04800533254941305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,8,power_law_1.01,0.03441280126571655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,8,power_law_1.01,0.049932798743247984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,8,power_law_1.01,0.03578880131244659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,8,power_law_1.01,0.05160319805145264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,8,power_law_1.01,0.057625597715377806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,8,power_law_1.01,0.036211198568344115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,8,power_law_1.01,0.06814720034599304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,8,power_law_1.01,0.03739520013332367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,8,balanced,0.05568000177542368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,8,power_law_1.01,0.04012160003185272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,8,power_law_1.01,0.0839680016040802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,8,power_law_1.01,0.039392000436782836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,8,power_law_1.01,0.1205631971359253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,8,power_law_1.01,0.03925119936466217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,8,power_law_1.01,0.0982208013534546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,8,balanced,0.07020266850789388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,8,power_law_1.01,0.045228800177574156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,8,power_law_1.01,0.14596480131149292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,8,power_law_1.01,0.04585599899291992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,8,power_law_1.01,0.15633280277252198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,8,power_law_1.01,0.024300800263881685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,8,power_law_1.01,0.05378559827804565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,8,power_law_1.01,0.22666239738464355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,8,power_law_1.01,0.06277120113372803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,8,power_law_1.01,0.024320000410079957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,8,balanced,0.08362666765848796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,8,power_law_1.01,0.25760641098022463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,8,power_law_1.01,0.06670079827308655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,8,power_law_1.01,0.024428799748420715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,8,power_law_1.01,0.3528575897216797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,8,power_law_1.01,0.0905344009399414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,8,power_law_1.2,0.028774398565292358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,8,power_law_1.01,0.025971201062202454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,8,power_law_1.01,0.46967039108276365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,8,power_law_1.01,0.10435839891433715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,8,power_law_1.01,0.02640640139579773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,8,power_law_1.2,0.02871040105819702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,8,power_law_1.01,0.6109568119049072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,8,power_law_1.2,0.02874239981174469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,8,balanced,0.11436800161997478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,8,power_law_1.01,0.14024319648742675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,8,power_law_1.01,0.02688640058040619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,8,power_law_1.2,0.029657599329948426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,8,power_law_1.01,0.9497535705566407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,8,power_law_1.2,0.02996479868888855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,8,power_law_1.01,0.16312960386276246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,8,power_law_1.01,0.027635198831558228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,8,power_law_1.2,0.037785598635673524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,8,power_law_1.01,0.2295680046081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,8,power_law_1.01,1.6909887313842773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,8,power_law_1.01,0.02794240117073059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,8,power_law_1.2,0.04562560021877289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,8,power_law_1.2,0.03550080060958862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,8,power_law_1.01,0.273305606842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,8,power_law_1.01,0.02869119942188263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,8,power_law_1.2,0.03578239977359772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,8,power_law_1.01,0.4163008213043213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,8,power_law_1.2,0.03687039911746979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,8,balanced,0.13769066333770752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,8,power_law_1.01,0.029017600417137145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,8,power_law_1.2,0.03729279935359955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,8,power_law_1.01,0.5233791828155517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,8,power_law_1.2,0.03901439905166626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,8,power_law_1.01,0.68755202293396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,8,power_law_1.2,0.0383103996515274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,8,balanced,0.21341866254806519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,8,power_law_1.2,0.043161600828170776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,8,power_law_1.01,0.9533696174621582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,8,power_law_1.01,0.03061760067939758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,8,power_law_1.2,0.048979198932647704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,8,power_law_1.01,1.9779136657714844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,8,power_law_1.2,0.04971520006656647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,8,power_law_1.01,0.033766400814056394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,8,balanced,0.2760853370030721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,8,power_law_1.2,0.05761920213699341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,8,power_law_1.01,0.03842560052871704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,8,power_law_1.2,0.07416319847106934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,8,power_law_1.2,0.08486400246620178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,8,power_law_1.01,0.03997440040111542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,8,power_law_1.2,0.12101759910583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,8,power_law_1.2,0.11016960144042968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,8,power_law_1.2,0.14403200149536133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,8,power_law_1.2,0.15123840570449829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,8,power_law_1.01,0.04523519873619079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,8,power_law_1.2,0.22184960842132567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,8,balanced,0.3455466826756795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,8,power_law_1.2,0.03121280074119568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,8,power_law_1.2,0.23633921146392822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,8,power_law_1.01,0.047993600368499756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,8,power_law_1.2,0.36039679050445556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,8,power_law_1.01,0.0531711995601654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,8,power_law_1.2,0.031327998638153075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,8,power_law_1.2,0.49271039962768554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,8,power_law_1.2,0.6031744003295898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,8,power_law_1.2,0.03142400085926056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,8,power_law_1.2,0.9601792335510254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,8,power_law_1.01,0.0650816023349762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,8,balanced,0.5261546770731608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,8,power_law_1.2,0.032646399736404416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,8,power_law_1.2,1.4685376167297364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,8,power_law_1.01,0.07765759825706482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,8,power_law_1.2,0.033011201024055484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,8,power_law_1.2,0.03380480110645294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,8,power_law_1.2,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,8,power_law_1.01,0.09923200011253357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,8,power_law_1.2,0.03418239951133728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,8,power_law_1.2,0.035334399342536925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,8,power_law_1.2,0.03537279963493347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,8,power_law_1.01,0.11909120082855225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,8,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,8,balanced,1.014895995457967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,8,power_law_1.2,0.04123519957065582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,8,power_law_1.01,0.17122559547424315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,8,power_law_1.2,0.038975998759269714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,8,power_law_1.2,0.039417600631713866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,8,power_law_1.01,0.2249664068222046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,8,power_law_1.2,0.04552960097789764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,8,power_law_1.01,0.3428992033004761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,8,power_law_1.2,0.04535039961338043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,8,power_law_1.2,0.02439039945602417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,8,power_law_1.2,0.05156480073928833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,8,power_law_1.2,0.024428799748420715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,8,power_law_1.01,0.4250175952911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,8,power_law_1.2,0.0615231990814209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,8,power_law_1.2,0.024742400646209715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,8,power_law_1.01,0.6873472213745118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,8,balanced,0.036714665591716766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,8,power_law_1.2,0.06598399877548218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,8,power_law_1.2,0.026169601082801818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,8,power_law_1.01,0.8575872421264649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,8,power_law_1.2,0.08613119721412658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,8,power_law_1.2,0.02696320116519928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,8,balanced,0.036943999429543815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,8,balanced,0.03700799991687139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,8,power_law_1.2,0.026918399333953857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,8,power_law_1.2,0.10703999996185302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,8,power_law_1.01,1.0423359870910645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,8,balanced,0.03775999943415324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,8,power_law_1.2,0.027456000447273254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,8,power_law_1.2,0.13960319757461548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,8,power_law_1.01,1.611974334716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,8,balanced,0.03774400055408478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,8,power_law_1.2,0.027980801463127137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,8,power_law_1.2,0.1643839955329895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,8,balanced,0.04111466556787491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,8,power_law_1.2,0.02892799973487854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,8,power_law_1.01,3.235532760620117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,8,power_law_1.2,0.23458559513092042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,8,power_law_1.2,0.02953599989414215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,8,balanced,0.04231466849644979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,8,power_law_1.2,0.2859391927719116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,8,balanced,0.041840001940727234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,8,power_law_1.2,0.40874881744384767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,8,balanced,0.04218666752179464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,8,power_law_1.2,0.029100799560546876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,8,power_law_1.2,0.5199168205261231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,8,balanced,0.04214933514595032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,8,power_law_1.2,0.03470079898834229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,8,balanced,0.042026668787002563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,8,power_law_1.2,0.6863808155059814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,8,power_law_1.2,0.03656319975852966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,8,balanced,0.04350399971008301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,8,power_law_1.2,0.04097279906272888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,8,power_law_1.2,1.0520383834838867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,8,balanced,0.043840001026789345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,8,power_law_1.2,1.8653568267822265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,8,balanced,0.0432586669921875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,8,power_law_1.2,0.04872319996356964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,8,balanced,0.04872000217437744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,8,power_law_1.2,0.04898560047149658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,8,balanced,0.04948266843954722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,8,power_law_1.2,0.05443199872970581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,8,balanced,0.05049066742261251
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,8,power_law_1.2,0.0686016023159027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,8,balanced,0.05657599866390228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,8,power_law_1.2,0.08052480220794678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,8,balanced,0.05541333556175232
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,8,balanced,0.0640533318122228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,8,power_law_1.2,0.110316801071167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,8,balanced,0.06864533325036366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,8,balanced,0.084389328956604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,8,power_law_1.2,0.1175104022026062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,8,balanced,0.08985599875450134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,8,balanced,0.034714666505654655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,8,balanced,0.13025599718093872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,8,power_law_1.2,0.17990399599075318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,8,balanced,0.03497066597143809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,8,balanced,0.035018667578697205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,8,balanced,0.13569066921869913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,8,power_law_1.2,0.2153791904449463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,8,balanced,0.03589333345492681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,8,balanced,0.03687999894221624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,8,power_law_1.2,0.3548671960830688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,8,balanced,0.20706667502721152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,8,balanced,0.03679466744263967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,8,balanced,0.037903999288876854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,8,power_law_1.2,0.4135744094848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,8,balanced,0.2367253303527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,8,balanced,0.03714666763941447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,8,power_law_1.2,0.6881792068481445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,8,balanced,0.03766400118668874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,8,power_law_1.2,0.8337087631225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,8,balanced,0.03815466662247976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,8,balanced,0.33460799853007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,8,balanced,0.03882133215665817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,8,power_law_1.2,1.0823871612548828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,8,balanced,0.03880000114440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,8,power_law_1.2,1.5764736175537108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,8,balanced,0.03958400090535482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,8,power_law_1.2,3.342803192138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,8,balanced,0.04011733333269755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,8,balanced,0.045381332437197365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,8,balanced,0.43999465306599933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,8,power_law_1.01,0.035820800065994265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,8,balanced,0.045610666275024414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,8,balanced,0.027930667002995808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,8,balanced,0.04715733230113983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,8,balanced,0.02812800059715907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,8,power_law_1.01,0.03576320111751556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,8,balanced,0.028090665737787884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,8,balanced,0.05402666827042898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,8,power_law_1.01,0.03597440123558045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,8,balanced,0.029509333272775013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,8,power_law_1.01,0.03687039911746979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,8,balanced,0.061717331409454346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,8,balanced,0.03046400099992752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,8,power_law_1.01,0.03736959993839264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,8,balanced,0.07765866816043854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,8,balanced,0.030693332354227703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,8,power_law_1.01,0.04686079919338226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,8,balanced,0.0867680013179779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,8,balanced,0.8368106683095297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,8,power_law_1.01,0.03418239951133728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,8,balanced,0.03107200066248576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,8,power_law_1.01,0.0574783980846405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,8,balanced,0.1123466690381368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,8,power_law_1.01,0.03433600068092346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,8,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,8,power_law_1.01,0.04314880073070526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,8,power_law_1.01,0.034483200311660765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,8,balanced,0.13011200229326883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,8,balanced,0.031034665803114574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,8,power_law_1.01,0.04298880100250244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,8,power_law_1.01,0.03596160113811493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,8,balanced,0.03202133377393087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,8,power_law_1.01,0.042796799540519716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,8,balanced,0.1827253301938375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,8,power_law_1.01,0.03617919981479645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,8,power_law_1.01,0.045286399126052854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,8,power_law_1.01,0.03670400083065033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,8,power_law_1.01,0.0466048002243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,8,balanced,0.21606399615605673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,8,power_law_1.01,0.03776000142097473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,8,power_law_1.01,0.049395200610160825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,8,power_law_1.01,0.03823359906673431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,8,balanced,0.03136533250411352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,8,power_law_1.01,0.04809600114822388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,8,balanced,0.316106657187144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,8,power_law_1.01,0.03951359987258911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,8,balanced,0.031632001201311745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,8,power_law_1.01,0.06002560257911682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,8,power_law_1.01,0.040275201201438904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,8,balanced,0.033157333731651306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,8,power_law_1.01,0.07337599992752075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,8,balanced,0.3917813301086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,8,power_law_1.01,0.04232960045337677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,8,balanced,0.03165333221356074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,8,power_law_1.01,0.0794431984424591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,8,power_law_1.01,0.04391680061817169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,8,power_law_1.01,0.11039999723434449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,8,power_law_1.01,0.042982399463653564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,8,balanced,0.5049973328908285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,8,power_law_1.01,0.09086719751358033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,8,power_law_1.01,0.046086400747299194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,8,power_law_1.01,0.050310397148132326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,8,power_law_1.01,0.11535999774932862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,8,balanced,0.0386613334218661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,8,power_law_1.01,0.052774399518966675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,8,power_law_1.01,0.11790080070495605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,8,balanced,0.03941333293914795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,8,power_law_1.01,0.05815039873123169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,8,power_law_1.01,0.1715456008911133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,8,balanced,0.03957333415746689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,8,power_law_1.01,0.027327999472618103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,8,balanced,0.7463146845499674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,8,power_law_1.01,0.0725823998451233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,8,power_law_1.01,0.21889920234680177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,8,power_law_1.01,0.02757120132446289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,8,power_law_1.01,0.08568320274353028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,8,power_law_1.01,0.3030656099319458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,8,power_law_1.01,0.027884799242019653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,8,power_law_1.01,0.11662720441818238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,8,power_law_1.01,0.029254400730133058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,8,power_law_1.01,0.37166080474853513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,8,balanced,0.046037331223487854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,8,power_law_1.01,0.029747200012207032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,8,power_law_1.01,0.12282240390777588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,8,power_law_1.01,0.47287678718566895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,8,balanced,0.051183998584747314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,8,power_law_1.01,0.03027839958667755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,8,power_law_1.2,0.036108800768852235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,8,power_law_1.01,0.1702911972999573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,8,power_law_1.01,0.6360320091247559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,8,power_law_1.01,0.03216640055179596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,8,power_law_1.01,0.21791999340057372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,8,power_law_1.2,0.0359935998916626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,8,power_law_1.01,0.03249920010566711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,8,power_law_1.01,0.8848832130432129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,8,power_law_1.01,0.03357439935207367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,8,power_law_1.01,0.33199999332427976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,8,power_law_1.2,0.03654400110244751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,8,balanced,1.4703787167867024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,8,power_law_1.01,1.4605888366699218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,8,power_law_1.01,0.034995201230049136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,8,power_law_1.01,0.3699392080307007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,8,balanced,0.06250133117039998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,8,power_law_1.2,0.038841599225997926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,8,power_law_1.01,0.5579775810241699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,8,power_law_1.01,2.6170560836791994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,8,power_law_1.2,0.037785598635673524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,8,power_law_1.01,0.033855998516082765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,8,power_law_1.01,0.7639808177947998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,8,balanced,0.07047999898592631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,8,power_law_1.01,0.04026240110397339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,8,power_law_1.2,0.05607680082321167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,8,power_law_1.01,0.9010111808776855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,8,power_law_1.01,0.04249599874019623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,8,power_law_1.2,0.05808640122413635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,8,power_law_1.01,0.04497919976711273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,8,power_law_1.01,1.5252991676330567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,8,power_law_1.2,0.04296959936618805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,8,power_law_1.01,2.589753532409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,8,balanced,0.09091732899347942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,8,power_law_1.01,0.052102398872375486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,8,power_law_1.2,0.04287999868392944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,8,power_law_1.01,0.05675519704818725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,8,power_law_1.2,0.043347200751304625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,8,power_law_1.01,0.0664192020893097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,8,power_law_1.2,0.04577920138835907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,8,balanced,0.1081813375155131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,8,power_law_1.01,0.08448640108108521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,8,power_law_1.2,0.046367999911308286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,8,power_law_1.01,0.11221760511398315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,8,power_law_1.2,0.049516800045967105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,8,power_law_1.01,0.1404096007347107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,8,power_law_1.2,0.047705599665641786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,8,power_law_1.2,0.07119359970092773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,8,power_law_1.01,0.18224639892578126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,8,balanced,0.15109866857528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,8,power_law_1.2,0.07308800220489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,8,power_law_1.01,0.257804799079895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,8,power_law_1.2,0.07895039916038513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,8,balanced,0.1946986714998881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,8,power_law_1.2,0.1044927954673767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,8,power_law_1.01,0.30193281173706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,8,power_law_1.2,0.09114879965782166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,8,balanced,0.3065813382466634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,8,power_law_1.2,0.12092800140380859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,8,power_law_1.01,0.4799808025360107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,8,power_law_1.2,0.11543040275573731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,8,power_law_1.01,0.5935423851013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,8,power_law_1.2,0.1771775960922241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,8,power_law_1.01,0.8933247566223145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,8,balanced,0.38307201862335205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,8,power_law_1.2,0.23144960403442383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,8,power_law_1.01,1.1593728065490723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,8,power_law_1.2,0.3473599910736084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,8,power_law_1.2,0.3674367904663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,8,power_law_1.2,0.48679041862487793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,8,power_law_1.2,0.03415040075778961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,8,power_law_1.01,1.528121566772461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,8,balanced,0.48635733127593994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,8,power_law_1.2,0.7218944072723389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,8,power_law_1.01,2.3552576065063477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,8,power_law_1.2,0.03463680148124695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,8,power_law_1.01,4.5469825744628904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,8,power_law_1.2,0.9131648063659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,8,power_law_1.2,0.03454079926013946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,8,power_law_1.2,1.46048002243042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,8,power_law_1.2,0.035750401020050046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,8,power_law_1.2,0.0361407995223999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,8,power_law_1.2,2.6141504287719726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,8,balanced,0.7363999684651693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,8,power_law_1.2,0.036550399661064145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,8,power_law_1.2,0.03815680146217346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,8,power_law_1.2,0.03877759873867035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,8,power_law_1.2,0.039289599657058714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,8,power_law_1.2,0.039955198764801025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,8,power_law_1.2,0.027347201108932497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,8,power_law_1.2,0.04299519956111908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,8,power_law_1.2,0.027692800760269164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,8,power_law_1.2,0.04311679899692535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,8,balanced,1.4366827011108398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,8,power_law_1.2,0.04344319999217987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,8,power_law_1.2,0.027801600098609925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,8,power_law_1.2,0.04547199904918671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,8,power_law_1.2,0.029369598627090453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,8,power_law_1.2,0.05123199820518494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,8,power_law_1.2,0.029747200012207032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,8,power_law_1.2,0.05309439897537231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,8,power_law_1.2,0.030131199955940248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,8,power_law_1.2,0.057094401121139525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,8,power_law_1.2,0.03294720053672791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,8,power_law_1.2,0.07686399817466735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,8,power_law_1.2,0.03296639919281006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,8,power_law_1.2,0.08796160221099854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,8,power_law_1.2,0.033843201398849485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,8,power_law_1.2,0.11723519563674926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,8,power_law_1.2,0.034944000840187076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,8,power_law_1.2,0.12438399791717529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,8,power_law_1.2,0.17164160013198854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,8,power_law_1.2,0.03472639918327332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,8,power_law_1.2,0.2207103967666626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,8,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,8,power_law_1.2,0.3305919885635376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,8,power_law_1.2,0.04317440092563629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,8,power_law_1.2,0.3870464086532593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,8,power_law_1.2,0.0500927984714508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,8,power_law_1.2,0.5615615844726562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,8,power_law_1.2,0.7553279876708985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,8,power_law_1.2,0.9066240310668945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,8,power_law_1.2,0.05203840136528015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,8,power_law_1.2,1.4581312179565429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,8,power_law_1.2,0.05725439786911011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,8,power_law_1.2,0.06651520133018493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,8,power_law_1.2,2.732524871826172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,8,power_law_1.2,0.08956159949302674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,8,power_law_1.2,0.10334080457687378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,8,power_law_1.2,0.1472640037536621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,8,power_law_1.2,0.1879807949066162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,8,power_law_1.2,0.26358399391174314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,8,power_law_1.2,0.3098367929458618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,8,power_law_1.2,0.49429759979248045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,8,power_law_1.2,0.620192003250122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,8,power_law_1.2,0.9381504058837891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,8,power_law_1.2,1.2252863883972167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,8,power_law_1.2,1.5432064056396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,256,balanced,0.19242133696873984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,256,balanced,0.11654399832089742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,8,power_law_1.2,2.2954816818237305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,256,balanced,0.19054933389027914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,256,balanced,0.11534933249155681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,256,balanced,0.19063466787338257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,8,power_law_1.2,4.531872177124024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,256,balanced,0.11823466420173645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,256,balanced,0.2003893256187439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,256,balanced,0.1197760005791982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,256,balanced,0.2030506730079651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,256,balanced,0.11575466394424438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,256,balanced,0.1957706610361735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,256,balanced,0.11649066209793091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,256,balanced,0.19912532965342203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,256,balanced,0.12064533432324727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,256,balanced,0.19977599382400513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,256,balanced,0.1267306705315908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,256,balanced,0.1936639944712321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,256,balanced,0.12599466244379678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,256,balanced,0.1930346687634786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,256,balanced,0.1272693375746409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,256,balanced,0.19618133703867593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,256,balanced,0.119759996732076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,256,balanced,0.20018666982650757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,256,balanced,0.13144532839457193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,256,balanced,0.12863467137018839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,256,balanced,0.1927786668141683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,256,balanced,0.048325334986050926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,256,balanced,0.12461866935094197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,256,balanced,0.1852746605873108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,256,balanced,0.13486933708190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,256,balanced,0.04735999802748362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,256,balanced,0.1986186703046163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,256,balanced,0.04839999973773956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,256,balanced,0.13130133350690207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,256,balanced,0.05403199791908264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,256,balanced,0.19780266284942627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,256,balanced,0.13281066219011942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,256,balanced,0.05268799761931101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,256,balanced,0.05305600166320801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,256,balanced,0.1902559995651245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,256,balanced,0.14191466569900513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,256,balanced,0.0544106662273407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,256,balanced,0.055162668228149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,256,balanced,0.20148799816767374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,256,balanced,0.150218665599823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,256,balanced,0.05515199899673462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,256,balanced,0.056133334835370384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,256,balanced,0.19765333334604898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,256,balanced,0.1681386629740397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,256,balanced,0.05589866638183594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,256,balanced,0.057333335280418396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,256,balanced,0.20465600490570068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,256,balanced,0.059402664502461754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,256,balanced,0.17762666940689087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,256,balanced,0.06015466650327047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,256,power_law_1.01,0.19162240028381347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,256,balanced,0.06471999982992808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,256,balanced,0.20031466086705527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,256,balanced,0.20399999618530273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,256,power_law_1.01,0.1938688039779663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,256,balanced,0.06625066697597504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,256,balanced,0.06841066479682922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,256,power_law_1.01,0.17772799730300903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,256,balanced,0.20362667242685953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,256,balanced,0.07720533510049184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,256,power_law_1.01,0.18439040184020997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,256,balanced,0.22613332668940225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,256,power_law_1.01,0.19728000164031984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,256,power_law_1.01,0.1934272050857544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,256,balanced,0.1911146640777588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,256,power_law_1.01,0.11484800577163697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,256,power_law_1.01,0.19514880180358887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,256,balanced,0.3478720188140869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,256,power_law_1.01,0.11856000423431397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,256,balanced,0.08316266536712646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,256,power_law_1.01,0.19119999408721924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,256,power_law_1.01,0.11514879465103149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,256,balanced,0.34572267532348633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,256,power_law_1.01,0.19082880020141602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,256,balanced,0.09701866904894511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,256,power_law_1.01,0.12026879787445069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,256,power_law_1.01,0.18881920576095582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,256,balanced,0.39209067821502686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,256,balanced,0.10710400342941284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,256,power_law_1.01,0.12083840370178223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,256,power_law_1.01,0.18799359798431398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,256,power_law_1.01,0.126528000831604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,256,power_law_1.01,0.18279680013656616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,256,power_law_1.01,0.12334719896316529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,256,balanced,0.32819199562072754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,256,power_law_1.01,0.17710720300674437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,256,power_law_1.01,0.11829119920730591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,256,power_law_1.01,0.18148479461669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,256,power_law_1.01,0.12184319496154786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,256,power_law_1.01,0.17210240364074708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,256,power_law_1.01,0.1214143991470337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,256,balanced,0.5650293429692587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,256,balanced,0.13387733697891235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,256,power_law_1.01,0.1633471965789795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,256,power_law_1.01,0.11863679885864258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,256,power_law_1.01,0.047788798809051514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,256,power_law_1.01,0.14260480403900147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,256,power_law_1.01,0.11874560117721558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,256,balanced,0.47117865085601807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,256,balanced,0.1552906632423401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,256,power_law_1.01,0.04661760032176972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,256,power_law_1.01,0.2600320100784302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,256,power_law_1.01,0.11822719573974609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,256,power_law_1.01,0.04716159999370575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,256,power_law_1.01,0.11777280569076538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,256,power_law_1.01,0.18776320219039916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,256,power_law_1.01,0.05211520195007324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,256,power_law_1.01,0.11670399904251098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,256,power_law_1.01,0.305676794052124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,256,power_law_1.01,0.05234559774398804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,256,power_law_1.01,0.1168895959854126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,256,power_law_1.01,0.397708797454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,256,balanced,0.7316479682922363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,256,power_law_1.01,0.11229439973831176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,256,power_law_1.01,0.05230720043182373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,256,power_law_1.01,0.5489471912384033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,256,power_law_1.01,0.1774399995803833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,256,power_law_1.01,0.05194240212440491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,256,power_law_1.01,0.629695987701416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,256,balanced,0.6081973314285278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,256,power_law_1.01,0.15928959846496582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,256,power_law_1.01,0.05338240265846252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,256,balanced,0.203984002272288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,256,power_law_1.01,0.9730688095092773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,256,power_law_1.01,0.22261760234832764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,256,power_law_1.01,0.05448960065841675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,256,power_law_1.01,1.3872384071350097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,256,power_law_1.01,0.26347520351409914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,256,power_law_1.01,0.05421440005302429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,256,power_law_1.01,2.1743295669555662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,256,power_law_1.01,0.3713023900985718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,256,power_law_1.01,0.05987840294837952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,256,balanced,0.24843200047810873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,256,power_law_1.01,0.4686079978942871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,256,power_law_1.01,2.7309568405151365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,256,power_law_1.01,0.06125440001487732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,256,balanced,0.901642640431722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,256,power_law_1.01,0.6689343929290772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,256,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,256,power_law_1.01,3.372832107543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,256,power_law_1.01,0.904793643951416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,256,power_law_1.01,0.06748800277709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,256,power_law_1.01,1.3548095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,256,power_law_1.2,0.18579839468002318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,256,power_law_1.01,5.708230209350586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,256,power_law_1.01,0.0723136007785797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,256,balanced,0.7448266347249349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,256,power_law_1.01,0.085343998670578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,256,power_law_1.01,1.8711488723754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,256,power_law_1.2,0.18528000116348267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,256,power_law_1.01,0.0886080026626587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,256,power_law_1.2,0.17331839799880983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,256,power_law_1.01,13.348300170898437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,256,power_law_1.01,2.168396759033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,256,power_law_1.2,0.19093120098114014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,256,power_law_1.01,0.1125440001487732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,256,power_law_1.01,3.793164825439453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,256,power_law_1.2,0.19474560022354126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,256,power_law_1.2,0.1931712031364441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,256,power_law_1.01,0.12319999933242798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,256,power_law_1.01,7.976512145996094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,256,balanced,0.348906675974528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,256,power_law_1.2,0.1929535984992981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,256,power_law_1.01,0.1565440058708191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,256,power_law_1.2,0.19034240245819092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,256,power_law_1.01,0.18982399702072145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,256,power_law_1.2,0.18859519958496093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,256,balanced,1.41265074412028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,256,power_law_1.2,0.1859007954597473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,256,power_law_1.2,0.1832576036453247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,256,power_law_1.01,0.25921919345855715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,256,power_law_1.2,0.17674239873886108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.01,0.3661695957183838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,256,balanced,1.1608106295267742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,256,power_law_1.2,0.17204480171203612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,256,power_law_1.2,0.1637503981590271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,256,balanced,0.4408160050710042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,256,power_law_1.01,0.4383039951324463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,256,power_law_1.2,0.1566848039627075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,256,power_law_1.2,0.14357759952545165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.01,0.5862207889556885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,256,power_law_1.2,0.2314176082611084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,256,power_law_1.2,0.27577600479125974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,256,power_law_1.01,0.8079999923706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,256,power_law_1.2,0.29896318912506104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,256,power_law_1.2,0.46538238525390624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,256,power_law_1.2,0.1115007996559143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,256,power_law_1.2,0.6300415992736816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.01,1.0774847984313964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,256,power_law_1.2,0.11632640361785888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,256,power_law_1.2,0.7485375881195069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,256,power_law_1.2,0.11553280353546143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,256,power_law_1.2,1.048902416229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,256,power_law_1.2,0.11793279647827148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,256,power_law_1.2,1.7167295455932616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,256,power_law_1.2,0.12004480361938477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,256,power_law_1.2,2.4326335906982424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,256,power_law_1.2,0.11944320201873779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,256,power_law_1.01,1.3837568283081054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,256,balanced,0.5497706731160482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,256,power_law_1.2,3.769977569580078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,256,power_law_1.2,0.11818879842758179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,256,power_law_1.2,0.11868799924850464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,256,power_law_1.2,5.8661247253417965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,256,power_law_1.2,0.11818879842758179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,256,power_law_1.2,8.167622375488282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,256,power_law_1.2,0.11968640089035035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,256,power_law_1.01,2.2021631240844726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,256,power_law_1.2,0.1183359980583191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,256,balanced,2.806960105895996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,256,power_law_1.01,4.680729675292969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,256,power_law_1.2,13.762675476074218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,256,power_law_1.2,0.1136896014213562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,256,power_law_1.2,0.11508480310440064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,256,power_law_1.2,0.11239039897918701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,256,balanced,2.302896022796631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,256,power_law_1.2,34.840396118164065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,256,power_law_1.2,0.10966399908065796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,256,power_law_1.2,0.10474879741668701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,256,power_law_1.2,0.14602240324020385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,256,power_law_1.2,0.15829119682312012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,256,balanced,0.8372480074564616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,256,power_law_1.2,0.20179200172424316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,256,power_law_1.2,0.2897088050842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,256,power_law_1.2,0.3380863904953003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,256,power_law_1.2,0.48891520500183105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,256,power_law_1.2,0.6565567970275878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,256,power_law_1.2,1.0523136138916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,256,power_law_1.2,1.5353407859802246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,256,power_law_1.2,2.376038360595703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,256,power_law_1.2,3.057369613647461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,256,power_law_1.2,4.382783889770508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,256,power_law_1.2,8.76534423828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,256,power_law_1.2,18.892863464355468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,256,balanced,1.6805866559346516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,128,balanced,0.11024533708890279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,128,balanced,0.10979732871055603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,128,balanced,0.11424533526102702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,256,power_law_1.2,0.047603198885917665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,128,balanced,0.11665599544843037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,128,balanced,0.11687999963760376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,256,power_law_1.2,0.046911999583244324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,128,balanced,0.2027519941329956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,256,power_law_1.2,0.04720639884471893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,128,balanced,0.20617065827051798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,256,power_law_1.2,0.05198720097541809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,128,balanced,0.20697067181269327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,256,power_law_1.2,0.05198720097541809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,128,balanced,0.20947200059890747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,256,power_law_1.2,0.0526528000831604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,128,balanced,0.19340799252192178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,256,power_law_1.2,0.05249919891357422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,128,balanced,0.20503467321395874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,256,power_law_1.2,0.05413119792938233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,128,balanced,0.2076746622721354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,128,balanced,0.19773866732915243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,256,power_law_1.2,0.055264002084732054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,128,balanced,0.1957333286603292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,256,power_law_1.2,0.057760000228881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,128,balanced,0.20397865772247314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,256,power_law_1.2,0.06026880145072937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,128,balanced,0.20292800664901733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,256,power_law_1.2,0.06387839913368225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,128,balanced,0.2027626633644104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,256,power_law_1.2,0.06700800061225891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,256,power_law_1.2,0.0688256025314331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,128,balanced,0.2023893396059672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,256,power_law_1.2,0.08517760038375854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,128,balanced,0.20256000757217407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,256,power_law_1.2,0.08565760254859925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,256,power_law_1.2,0.10491520166397095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,128,balanced,0.20949333906173706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,256,power_law_1.2,0.1390720009803772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,128,balanced,0.2032853364944458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,256,power_law_1.2,0.15040639638900757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,128,balanced,0.20320000251134238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,256,power_law_1.2,0.22131199836730958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,256,power_law_1.2,0.2890559911727905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,128,balanced,0.19427732626597086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,128,balanced,0.07732800145943959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,256,power_law_1.2,0.4170048236846924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,128,balanced,0.07765866816043854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,128,balanced,0.36236266295115155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,128,balanced,0.07807999849319458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.2,0.5937727928161621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,128,balanced,0.07996800045172374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,128,balanced,0.07825600107510884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,128,balanced,0.12342933813730876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,256,power_law_1.2,0.7012415885925293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,128,balanced,0.126309335231781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,128,balanced,0.12827733159065247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,128,balanced,0.3356746832529704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.2,0.998316764831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,128,balanced,0.12922666470209757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,128,balanced,0.043365334471066795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,128,balanced,0.1312320033709208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,128,balanced,0.04410133262475332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,128,balanced,0.13460266590118408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,128,power_law_1.01,0.12166399955749511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,256,power_law_1.2,1.4711296081542968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,128,balanced,0.04400533437728882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,128,balanced,0.13479999701182047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,128,power_law_1.01,0.19419519901275634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,128,power_law_1.01,0.12273279428482056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,128,balanced,0.04721599817276001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,128,balanced,0.13037332892417908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.2,1.9099199295043945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,128,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,128,power_law_1.01,0.10157439708709717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,128,power_law_1.01,0.1919167995452881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,128,balanced,0.47958401838938397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,128,balanced,0.13326932986577353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,128,balanced,0.0521066685517629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,128,power_law_1.01,0.1757375955581665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,128,power_law_1.01,0.11692800521850585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,128,balanced,0.14009066422780356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,128,balanced,0.05416533350944519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,128,power_law_1.01,0.17749760150909424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,128,power_law_1.01,0.12225919961929321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,128,balanced,0.13823466499646506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,256,power_law_1.2,2.748454475402832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,128,balanced,0.05452266832192739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,128,power_law_1.01,0.1992640018463135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,128,power_law_1.01,0.12557439804077147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,128,balanced,0.13730133573214212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,128,balanced,0.05483733117580414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,128,power_law_1.01,0.20163838863372802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,128,power_law_1.01,0.1266111969947815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,128,balanced,0.055386667450269066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,256,power_law_1.2,3.8027198791503904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,128,balanced,0.15155733625094095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,128,power_law_1.01,0.2031167984008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,128,power_law_1.01,0.12464640140533448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,128,balanced,0.055770665407180786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,128,balanced,0.15105066696802774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,128,power_law_1.01,0.11979520320892334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,128,power_law_1.01,0.1986624002456665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,128,balanced,0.6195946534474691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,128,balanced,0.057477335135142006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,256,power_law_1.2,8.071270751953126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,128,power_law_1.01,0.1268288016319275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,128,power_law_1.01,0.19468159675598146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,128,balanced,0.05789866546789805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,128,balanced,0.16918933391571045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,128,power_law_1.01,0.1262336015701294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,128,power_law_1.01,0.1970752000808716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,128,balanced,0.059690664211908974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,128,balanced,0.18196266889572144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,128,power_law_1.01,0.19217920303344727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,128,power_law_1.01,0.1258687973022461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,128,balanced,0.06566399832566579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,128,power_law_1.01,0.12784639596939087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,128,power_law_1.01,0.1942911982536316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,128,balanced,0.06675733129183452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,128,balanced,0.2057653268178304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,128,power_law_1.01,0.12499200105667115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,128,power_law_1.01,0.19139839410781861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,128,balanced,0.06865600248177846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,128,power_law_1.01,0.12896640300750734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,128,power_law_1.01,0.18289920091629028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,128,balanced,0.2299999992052714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,128,power_law_1.01,0.12400640249252319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,128,power_law_1.01,0.18158719539642335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,128,balanced,0.7616426944732666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,128,balanced,0.0780320018529892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,128,power_law_1.01,0.12212480306625366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,128,power_law_1.01,0.17956479787826538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,128,power_law_1.01,0.1464959979057312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,128,power_law_1.01,0.1716096043586731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,128,balanced,0.36072532335917157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,128,power_law_1.01,0.16401920318603516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,128,power_law_1.01,0.04764159917831421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,128,power_law_1.01,0.17096960544586182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,128,power_law_1.01,0.2044287919998169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,128,power_law_1.01,0.04574080109596253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,128,power_law_1.01,0.23420159816741942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,128,power_law_1.01,0.0459199994802475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,128,power_law_1.01,0.26635520458221434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,128,power_law_1.01,0.30141439437866213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,128,balanced,0.08444799979527791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,128,power_law_1.01,0.049779200553894044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,128,power_law_1.01,0.34652159214019773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,128,power_law_1.01,0.3232320070266724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,128,power_law_1.01,0.050361597537994386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,128,balanced,0.4014933506647746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,128,balanced,0.09880533814430237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,128,power_law_1.2,0.19185279607772826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,128,power_law_1.01,0.44632320404052733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,128,power_law_1.01,0.0516543984413147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,128,power_law_1.01,0.4701632022857666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,128,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,128,power_law_1.01,0.6315839767456055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,128,power_law_1.2,0.1909119963645935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,128,power_law_1.01,0.5517248153686524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,128,balanced,0.10904533664385478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,128,power_law_1.01,0.05366399884223938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,128,power_law_1.2,0.14086400270462035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,128,power_law_1.01,0.7886591911315918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,128,power_law_1.01,0.7686399936676025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,128,power_law_1.01,0.05516800284385681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,128,power_law_1.2,0.16442240476608277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,128,power_law_1.01,0.05553280115127564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,128,power_law_1.01,1.1851712226867677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,128,power_law_1.01,0.9773887634277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,128,power_law_1.01,0.05870720148086548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,128,power_law_1.2,0.20329599380493163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,128,balanced,0.5751306613286337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,128,power_law_1.01,1.597555160522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,128,power_law_1.01,1.7065343856811523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,128,balanced,1.1856906414031982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,128,power_law_1.01,0.06032639741897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,128,power_law_1.2,0.1981055974960327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,128,power_law_1.01,2.030803108215332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,128,power_law_1.01,0.06302080154418946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,128,power_law_1.01,2.043756866455078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,128,power_law_1.2,0.203110408782959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,128,power_law_1.01,0.06639360189437866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,128,power_law_1.2,0.1958016037940979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,128,balanced,0.13727466265360513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,128,power_law_1.01,3.274534225463867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,128,power_law_1.01,2.5701311111450194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,128,power_law_1.2,0.19816319942474364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,128,power_law_1.01,0.071424001455307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,128,power_law_1.2,0.19516799449920655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,128,power_law_1.01,4.317772674560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,128,power_law_1.01,0.08170239925384522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,128,power_law_1.01,6.550566101074219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,128,power_law_1.2,0.19438079595565796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,128,balanced,0.16060800353686014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,128,power_law_1.01,0.09317759871482849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,128,power_law_1.2,0.192684805393219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,128,power_law_1.01,9.807520294189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,128,balanced,0.7469600041707357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,128,power_law_1.01,0.1095039963722229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,128,power_law_1.2,0.18906240463256835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,128,power_law_1.2,0.1711680054664612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,128,power_law_1.2,0.1807039976119995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,128,power_law_1.01,0.11914240121841431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,128,power_law_1.2,0.17237119674682616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,128,balanced,0.2129866679509481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,128,power_law_1.2,0.19717760086059571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,128,power_law_1.01,0.15185920000076295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,128,power_law_1.2,0.24593279361724854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,128,power_law_1.01,0.19032959938049315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,128,power_law_1.2,0.2744191884994507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,128,power_law_1.2,0.3380095958709717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,128,balanced,0.26153600215911865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,128,power_law_1.2,0.404531192779541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,128,power_law_1.01,0.23736319541931153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,128,balanced,0.9210560321807861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,128,power_law_1.2,0.5087808132171631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,128,power_law_1.01,0.32279679775238035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,128,power_law_1.2,0.6850687980651855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,128,power_law_1.2,1.173804759979248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,128,power_law_1.01,0.4111040115356445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,128,power_law_1.2,1.713248062133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,128,power_law_1.01,0.626585578918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,128,power_law_1.2,2.7405439376831056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,128,power_law_1.2,3.1196544647216795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,128,power_law_1.01,0.7993663787841797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,128,balanced,0.36608533064524335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,128,power_law_1.2,4.76943359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,128,power_law_1.01,1.0490943908691406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,128,power_law_1.2,7.180441284179688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,128,balanced,2.361695925394694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,128,power_law_1.01,1.2815168380737305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,128,power_law_1.2,22.470681762695314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,128,balanced,1.4388267199198406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,128,power_law_1.01,2.0743743896484377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,128,balanced,0.4660213390986125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,128,power_law_1.01,4.387839889526367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,128,balanced,0.5799520015716553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,128,power_law_1.2,0.12090879678726196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,128,balanced,0.8998346328735352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,128,power_law_1.2,0.12322560548782349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,128,power_law_1.2,0.10491520166397095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,128,balanced,2.8643147150675454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,128,power_law_1.2,0.12400640249252319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,128,power_law_1.2,0.11966079473495483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,128,power_law_1.2,0.11737600564956666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,128,power_law_1.2,0.1250432014465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,128,power_law_1.2,0.12641919851303102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,128,power_law_1.2,0.12609920501708985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,128,power_law_1.2,0.12471040487289428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,128,power_law_1.2,0.12399359941482543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,128,power_law_1.2,0.12624640464782716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,128,power_law_1.2,0.1245695948600769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,128,power_law_1.2,0.12400000095367432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,128,power_law_1.2,0.1251456022262573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,128,power_law_1.2,0.12012799978256225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,128,power_law_1.2,0.13609600067138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,128,power_law_1.2,0.14392319917678834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,128,power_law_1.2,0.1963711977005005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,128,power_law_1.2,0.26207358837127687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,128,power_law_1.2,0.309497594833374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,128,balanced,1.8150134086608887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,128,power_law_1.2,0.4257472038269043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,128,power_law_1.2,0.5313600063323974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,128,power_law_1.2,0.789574384689331
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,128,power_law_1.2,1.1420479774475099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,64,balanced,0.0925546685854594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,64,balanced,0.08787199854850769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,128,power_law_1.2,1.4981504440307618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,64,balanced,0.09346133470535278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,128,power_law_1.2,2.3050432205200195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,64,balanced,0.09620799620946248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,128,power_law_1.2,2.723641586303711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,128,power_law_1.2,0.047244799137115476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,64,balanced,0.12050666411717732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,128,power_law_1.2,5.068435287475586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,64,balanced,0.19559999306996664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,128,power_law_1.2,0.04597119987010956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,128,power_law_1.2,0.04550400078296661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,64,balanced,0.21426665782928467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,128,power_law_1.2,14.05927734375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,64,balanced,0.2025066614151001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,128,power_law_1.2,0.05084800124168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,64,balanced,0.19986132780710855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,128,power_law_1.2,0.05125759840011597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,64,balanced,0.21228265762329102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,128,power_law_1.2,0.05273600220680237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,64,balanced,0.20284799734751383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,128,power_law_1.2,0.05343359708786011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,64,balanced,0.20084265867869058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,128,power_law_1.2,0.0548799991607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,64,balanced,0.22058133284250894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,128,power_law_1.2,0.05504000186920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,64,balanced,0.19085333744684854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,128,power_law_1.2,0.058156800270080564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,64,balanced,0.21342400709788004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,128,power_law_1.2,0.060153597593307497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,64,balanced,0.21600000063578287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,128,power_law_1.2,0.062105602025985716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,64,balanced,0.18928533792495728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,128,power_law_1.2,0.06407039761543273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,64,balanced,0.2084746758143107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,128,power_law_1.2,0.07145599722862243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,64,balanced,0.2042613426844279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,128,power_law_1.2,0.08009600043296813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,64,balanced,0.20995734135309854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,128,power_law_1.2,0.08498560190200806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,128,power_law_1.2,0.09607040286064147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,64,balanced,0.2063680092493693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,128,power_law_1.2,0.11709439754486084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,64,balanced,0.06452266871929169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,64,balanced,0.20651199420293173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,64,balanced,0.06422399977842967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,64,balanced,0.06401599943637848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,128,power_law_1.2,0.13871999979019164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,64,power_law_1.01,0.1997760057449341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,64,balanced,0.20576000213623047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,64,balanced,0.06718933085600536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,128,power_law_1.2,0.18753279447555543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,64,power_law_1.01,0.19769599437713622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,64,balanced,0.0805866668621699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,128,power_law_1.2,0.243123197555542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,64,balanced,0.13212266564369202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,64,power_law_1.01,0.179967999458313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,64,balanced,0.3911679983139038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,64,balanced,0.12997333208719888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,64,power_law_1.01,0.15460480451583863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,64,balanced,0.13268267114957175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,128,power_law_1.2,0.28614399433135984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,64,balanced,0.04345599810282389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,64,power_law_1.01,0.1702911972999573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,64,balanced,0.1267039974530538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,128,power_law_1.2,0.4452991962432861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,64,balanced,0.043696001172065735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,64,balanced,0.13845333456993103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,64,power_law_1.01,0.1743615984916687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,64,balanced,0.04374399781227112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,64,balanced,0.3550613323847453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,64,balanced,0.13085866967837015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,64,power_law_1.01,0.1823040008544922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,128,power_law_1.2,0.6016960144042969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,64,balanced,0.046821330984433494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,64,balanced,0.12326400478680928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,64,power_law_1.01,0.18703999519348144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,128,power_law_1.2,0.7532415866851807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,64,balanced,0.04710933566093445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,64,balanced,0.1323306659857432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,64,balanced,0.05453333258628845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,64,power_law_1.01,0.1673535943031311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,64,balanced,0.13062399625778198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,64,balanced,0.05622933308283488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,128,power_law_1.2,1.1910271644592285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,64,power_law_1.01,0.17776639461517335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,64,balanced,0.05701333284378052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,64,balanced,0.1421386698881785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,64,balanced,0.5076533158620199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,64,power_law_1.01,0.17950079441070557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,128,power_law_1.2,1.4858624458312988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,64,balanced,0.05665066838264465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,64,balanced,0.14593600233395895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,64,balanced,0.057301332553227745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,64,power_law_1.01,0.18695679903030396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,64,balanced,0.14375999569892883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,64,balanced,0.05801600217819214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,128,power_law_1.2,2.1686912536621095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,64,power_law_1.01,0.18748799562454224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,64,balanced,0.0595360000928243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,64,balanced,0.15501333276430765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,64,power_law_1.01,0.18286720514297486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,128,power_law_1.2,3.044953536987305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,64,balanced,0.06108800073464712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,64,balanced,0.15613333384195963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,64,power_law_1.01,0.18434560298919678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,64,balanced,0.06262933214505513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,128,power_law_1.2,7.118041229248047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,64,power_law_1.01,0.18595839738845826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,64,balanced,0.17688000202178955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,64,balanced,0.06805866460005443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,64,balanced,0.6547626654307047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,64,balanced,0.06899733344713847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,64,power_law_1.01,0.18149759769439697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,64,balanced,0.1891146699587504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,64,balanced,0.07155733307202657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,64,power_law_1.01,0.21838719844818116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,64,power_law_1.01,0.12787840366363526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,64,power_law_1.01,0.20821120738983154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,64,balanced,0.21518399318059286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,64,power_law_1.01,0.12869759798049926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,64,power_law_1.01,0.2860543966293335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,64,balanced,0.08061333497365315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,64,power_law_1.01,0.11330560445785523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,64,power_law_1.01,0.3234816074371338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,64,power_law_1.01,0.09299200177192687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,64,balanced,0.239519993464152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,64,power_law_1.01,0.1019327998161316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,64,power_law_1.01,0.4078656196594238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,64,balanced,0.8039413293202718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,64,power_law_1.01,0.11703039407730102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,64,power_law_1.01,0.5035200119018555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,64,power_law_1.01,0.12539520263671874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,64,balanced,0.3798186779022217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,64,balanced,0.08790399630864461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,64,power_law_1.01,0.7241600036621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,64,power_law_1.01,0.12334719896316529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,64,power_law_1.01,0.8386943817138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,64,balanced,0.1037600040435791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,64,power_law_1.01,0.12294399738311768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,64,power_law_1.01,1.3309696197509766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,64,power_law_1.01,0.12005759477615356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,64,balanced,0.11506666739781697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,64,balanced,0.42026134332021076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,64,power_law_1.01,1.822528076171875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,64,power_law_1.01,0.12463359832763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,64,power_law_1.01,0.12845439910888673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,64,power_law_1.01,2.030899238586426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,64,power_law_1.01,0.12670719623565674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,64,power_law_1.01,0.1314239978790283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,64,power_law_1.01,3.873311996459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,64,power_law_1.01,0.1258944034576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,64,power_law_1.01,0.13237760066986085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,64,balanced,0.14688533544540405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,64,power_law_1.01,8.053433227539063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,64,balanced,0.6038986841837565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,64,power_law_1.01,0.13667839765548706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,64,balanced,1.2523307005564372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,64,power_law_1.01,0.15029120445251465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,64,balanced,0.17235199610392252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,64,power_law_1.01,0.17363200187683106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,64,power_law_1.01,0.20814080238342286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,64,power_law_1.01,0.2608448028564453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,64,power_law_1.01,0.3358527898788452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,64,power_law_1.01,0.05100160241127014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,64,balanced,0.7800479729970297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,64,power_law_1.01,0.4297791957855225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,64,balanced,0.2324906587600708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,64,power_law_1.01,0.04928640127182007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,64,power_law_1.01,0.5671167850494385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,64,power_law_1.01,0.04696959853172302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,64,power_law_1.01,0.7182079792022705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,64,power_law_1.01,0.050195199251174924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,64,power_law_1.01,0.05145599842071533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,64,power_law_1.01,1.0314559936523438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,64,power_law_1.01,0.05322880148887634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,64,balanced,0.2861706614494324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,64,power_law_1.01,0.05372160077095032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,64,power_law_1.01,1.3900799751281738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,64,power_law_1.01,0.05563520193099976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,64,power_law_1.01,1.8611583709716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,64,power_law_1.01,0.05875200033187866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,64,power_law_1.01,0.05790719985961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,64,power_law_1.01,2.619686317443848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,64,power_law_1.01,0.06087679862976074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,64,balanced,0.9616426626841227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,64,power_law_1.01,0.06234239935874939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,64,power_law_1.01,5.798470306396484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,64,power_law_1.01,0.0640447974205017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,64,power_law_1.01,0.06949120163917541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,64,power_law_1.01,0.07574399709701538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,64,power_law_1.01,0.07808640003204345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,64,balanced,0.406490683555603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,64,power_law_1.2,0.1928704023361206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,64,power_law_1.01,0.0831167995929718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,64,power_law_1.2,0.1938367962837219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,64,power_law_1.01,0.10845439434051514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,64,power_law_1.2,0.10439039468765259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,64,power_law_1.2,0.13931519985198976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,64,power_law_1.01,0.1172287940979004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,64,power_law_1.2,0.1597759962081909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,64,power_law_1.01,0.14776320457458497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,64,balanced,2.508021354675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,64,power_law_1.2,0.18883199691772462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,64,power_law_1.01,0.16968319416046143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,64,balanced,0.533946673075358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,64,power_law_1.2,0.18177920579910278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,64,balanced,1.5029813448588054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,64,power_law_1.2,0.18981759548187255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,64,power_law_1.01,0.2287168025970459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,64,power_law_1.2,0.16380159854888915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,64,power_law_1.01,0.29630720615386963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,64,power_law_1.2,0.19531519412994386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,64,power_law_1.01,0.4344128131866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,64,power_law_1.2,0.17783039808273315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,64,power_law_1.01,0.547219181060791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,64,power_law_1.2,0.18723200559616088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,64,power_law_1.01,0.7706751823425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,64,power_law_1.2,0.19598079919815065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,64,power_law_1.01,1.0656703948974608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,64,power_law_1.2,0.18176640272140504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,64,power_law_1.2,0.17272959947586058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,64,balanced,0.6783040364583334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,64,power_law_1.01,1.2552703857421874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,64,power_law_1.2,0.19844479560852052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,64,power_law_1.01,2.1317888259887696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,64,power_law_1.2,0.17842559814453124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,64,power_law_1.2,0.2121216058731079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,64,power_law_1.01,4.153606414794922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,64,power_law_1.2,0.26168959140777587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,64,power_law_1.2,0.3268800020217896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,64,power_law_1.2,0.3799295902252197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,64,power_law_1.2,0.5121535778045654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,64,power_law_1.2,0.6826303958892822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,64,power_law_1.2,0.8839743614196778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,64,power_law_1.2,1.235769557952881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,64,power_law_1.2,1.6658432006835937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,64,power_law_1.2,2.3622079849243165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,64,balanced,1.0418933232625325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,64,power_law_1.2,3.049491119384766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,64,power_law_1.2,4.924409484863281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,64,balanced,2.9865919748942056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,64,power_law_1.2,11.507718658447265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,64,power_law_1.2,0.12802560329437257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,64,power_law_1.2,0.12637439966201783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,64,power_law_1.2,0.08692479729652405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,64,power_law_1.2,0.0883520007133484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,64,power_law_1.2,0.10371840000152588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,64,power_law_1.2,0.11433600187301636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,64,power_law_1.2,0.12629760503768922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,64,power_law_1.2,0.1208575963973999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,64,power_law_1.2,0.118777596950531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,64,power_law_1.2,0.1308608055114746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,64,power_law_1.2,0.12200319766998291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,64,power_law_1.2,0.12903679609298707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,64,power_law_1.2,0.12174079418182374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,64,power_law_1.2,0.12424960136413574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,64,power_law_1.2,0.13164160251617432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,64,power_law_1.2,0.13460479974746703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,64,power_law_1.2,0.147705602645874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,64,power_law_1.2,0.17065600156784058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,64,balanced,2.0707839330037436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,64,power_law_1.2,0.1903807997703552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,64,power_law_1.2,0.23815679550170898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,64,power_law_1.2,0.05135999917984009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,64,power_law_1.2,0.29395198822021484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,64,power_law_1.2,0.049107199907302855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,64,power_law_1.2,0.3733952045440674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,64,power_law_1.2,0.046387198567390445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,64,power_law_1.2,0.048819199204444885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,64,power_law_1.2,0.4969600200653076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,64,power_law_1.2,0.05314559936523437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,64,power_law_1.2,0.6508992195129395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,64,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,64,power_law_1.2,0.0543615996837616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,64,power_law_1.2,0.880735969543457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,64,power_law_1.2,0.05614719986915588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,64,power_law_1.2,0.05626879930496216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,64,power_law_1.2,1.4307264328002929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,64,power_law_1.2,0.058976000547409056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,64,power_law_1.2,0.061843198537826535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,64,power_law_1.2,1.6273664474487304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,64,power_law_1.2,0.0639743983745575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,64,power_law_1.2,0.06540799736976624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,64,power_law_1.2,2.386195182800293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,64,power_law_1.2,0.07014399766921997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,64,power_law_1.2,0.07559679746627808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,64,power_law_1.2,4.084223937988281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,64,power_law_1.2,0.0807039976119995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,32,balanced,0.05465066432952881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,64,power_law_1.2,0.09098240137100219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,64,power_law_1.2,8.056281280517577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,32,balanced,0.054602667689323425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,64,power_law_1.2,0.1091264009475708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,32,balanced,0.054431999723116554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,32,balanced,0.05718400080998739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,32,balanced,0.06071466704209646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,64,power_law_1.2,0.12387839555740357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,32,balanced,0.07250133156776428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,64,power_law_1.2,0.17943040132522584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,32,balanced,0.047210668524106346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,32,balanced,0.07322666545708974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,64,power_law_1.2,0.21264638900756835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,32,balanced,0.07281066477298737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,32,balanced,0.047594666481018066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,32,balanced,0.07299200197060902
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,32,balanced,0.04730666677157084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,64,power_law_1.2,0.2999743938446045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,32,balanced,0.05093333125114441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,32,balanced,0.07377066711584727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,64,power_law_1.2,0.3877120018005371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,32,balanced,0.052560001611709595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,32,balanced,0.07539199789365132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,32,balanced,0.07551999886830647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,32,balanced,0.05875200033187866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,64,power_law_1.2,0.5389247894287109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,32,balanced,0.07534400125344594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,32,balanced,0.05906666815280914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,64,power_law_1.2,0.783897590637207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,32,balanced,0.062319998939832054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,32,balanced,0.0775626649459203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,32,balanced,0.06234666705131531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,32,balanced,0.08016000191370647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,64,power_law_1.2,1.0716287612915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,32,balanced,0.06354666749636333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,32,balanced,0.08031466603279114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,64,power_law_1.2,1.5885696411132812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,32,balanced,0.06509333352247874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,32,balanced,0.08475200335184734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,32,balanced,0.06554666658242543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,64,power_law_1.2,1.7256000518798829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,32,balanced,0.09275733431180318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,32,balanced,0.0673333356777827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,64,power_law_1.2,2.6457984924316404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,32,balanced,0.09681066870689392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,32,balanced,0.06951466699441274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,64,power_law_1.2,6.512281799316407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,32,balanced,0.07460266848405202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,32,balanced,0.10878933469454448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,32,balanced,0.07618666688601176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,32,balanced,0.12309333682060242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,32,balanced,0.0804319977760315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,32,balanced,0.09166933099428813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,32,balanced,0.14547733465830484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,32,balanced,0.1002506713072459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,32,balanced,0.043237333496411644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,32,balanced,0.04393066465854645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,32,balanced,0.12115733822186787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,32,balanced,0.16821332772572836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,32,balanced,0.04403733213742574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,32,balanced,0.047695999344189964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,32,balanced,0.13917866349220276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,32,balanced,0.0496373325586319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,32,balanced,0.058320000767707825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,32,balanced,0.2143519918123881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,32,balanced,0.17330666383107504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,32,balanced,0.05932266513506571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,32,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,32,balanced,0.06098133325576782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,32,balanced,0.21015999714533487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,32,balanced,0.06158400078614553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,32,balanced,0.06276266773541768
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,32,balanced,0.26680533091227215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,32,balanced,0.06374399860699971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,32,power_law_1.01,0.09242240190505982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,32,balanced,0.06555733581384023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,32,balanced,0.28405867020289105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,32,power_law_1.01,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,32,balanced,0.06655466556549072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,32,power_law_1.01,0.0644927978515625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,32,balanced,0.07258666555086772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,32,power_law_1.01,0.06584320068359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,32,balanced,0.07459733386834462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,32,power_law_1.01,0.06508799791336059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,32,balanced,0.07681066791216533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,32,balanced,0.35793598492940265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,32,balanced,0.3591573238372803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,32,power_law_1.01,0.0679040014743805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,32,power_law_1.01,0.06986879706382751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,32,power_law_1.01,0.0697983980178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,32,balanced,0.08923733234405518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,32,power_law_1.01,0.05907840132713318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,32,power_law_1.01,0.07125120162963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,32,power_law_1.01,0.07104640007019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,32,power_law_1.01,0.05374079942703247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,32,power_law_1.01,0.07259520292282104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,32,power_law_1.01,0.05314559936523437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,32,balanced,0.5066239833831787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,32,power_law_1.01,0.07217280268669128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,32,power_law_1.01,0.05486080050468445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,32,balanced,0.4694240093231201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,32,balanced,0.09640000263849895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,32,power_law_1.01,0.07432320117950439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,32,power_law_1.01,0.05792639851570129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,32,power_law_1.01,0.07514240145683289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,32,balanced,0.11507200201352437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,32,power_law_1.01,0.05902079939842224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,32,power_law_1.01,0.07895680069923401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,32,power_law_1.01,0.06054400205612183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,32,balanced,0.12873066465059915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,32,power_law_1.01,0.08422399759292602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,32,power_law_1.01,0.06090880036354065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,32,power_law_1.01,0.08867200016975403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,32,balanced,0.6488586664199829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,32,power_law_1.01,0.059622400999069215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,32,power_law_1.01,0.09134719967842102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,32,power_law_1.01,0.06303359866142273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,32,power_law_1.01,0.11941759586334229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,32,power_law_1.01,0.0671231985092163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,32,power_law_1.01,0.12373119592666626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,32,balanced,0.16809600591659546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,32,balanced,0.5688213507334391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,32,power_law_1.01,0.06756479740142822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,32,power_law_1.01,0.13723520040512086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,32,power_law_1.01,0.07015680074691773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,32,power_law_1.01,0.15998079776763915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,32,power_law_1.01,0.19514880180358887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,32,balanced,0.19589867194493613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,32,power_law_1.01,0.07826560139656066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,32,power_law_1.01,0.22801918983459474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,32,power_law_1.01,0.08169599771499633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,32,power_law_1.01,0.3255872011184692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,32,power_law_1.01,0.08681600093841553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,32,power_law_1.01,0.06007680296897888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,32,balanced,0.8195306460062662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,32,power_law_1.01,0.3892863988876343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,32,power_law_1.01,0.10373120307922364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,32,power_law_1.01,0.05580800175666809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,32,power_law_1.01,0.5355711936950683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,32,power_law_1.01,0.04935039877891541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,32,power_law_1.01,0.11918720006942748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,32,balanced,0.28091732660929364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,32,power_law_1.01,0.6972095966339111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,32,power_law_1.01,0.052185600996017455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,32,power_law_1.01,0.1409343957901001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,32,power_law_1.01,0.8880255699157715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,32,power_law_1.01,0.054604798555374146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,32,power_law_1.01,0.16291840076446534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,32,power_law_1.01,0.05644800066947937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,32,power_law_1.01,1.2834624290466308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,32,power_law_1.01,0.2175679922103882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,32,balanced,0.35762667655944824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,32,power_law_1.01,0.05850239992141724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,32,power_law_1.01,0.2569792032241821
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,32,power_law_1.01,2.8501056671142577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,32,power_law_1.01,0.05978239774703979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,32,balanced,0.8281439940134684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,32,power_law_1.01,0.36561920642852785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,32,power_law_1.01,0.060313600301742556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,32,power_law_1.01,0.4392255783081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,32,power_law_1.01,0.062438398599624634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,32,power_law_1.01,0.06624640226364135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,32,power_law_1.01,0.6481023788452148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,32,power_law_1.01,0.06704639792442321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,32,power_law_1.01,0.8559103965759277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,32,balanced,1.234335978825887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,32,power_law_1.01,0.06934400200843811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,32,power_law_1.01,1.142137622833252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,32,power_law_1.01,0.07374079823493958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,32,power_law_1.01,0.08010879755020142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,32,power_law_1.01,1.6120128631591797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,32,balanced,0.5182826519012451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,32,power_law_1.2,0.09257599711418152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,32,power_law_1.01,0.08395519852638245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,32,power_law_1.01,3.151238441467285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,32,power_law_1.2,0.07349759936332703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,32,power_law_1.01,0.09520639777183533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,32,power_law_1.2,0.059436798095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,32,power_law_1.01,0.11331839561462402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,32,power_law_1.2,0.06691200137138367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,32,power_law_1.2,0.06424959897994995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,32,power_law_1.2,0.06695039868354798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,32,power_law_1.01,0.12108800411224366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,32,balanced,0.6730026404062907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,32,power_law_1.2,0.06992639899253845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,32,power_law_1.01,0.161407995223999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,32,power_law_1.2,0.0717311978340149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,32,power_law_1.01,0.19322240352630615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,32,power_law_1.2,0.07094399929046631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,32,power_law_1.2,0.07241600155830383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,32,power_law_1.01,0.27153921127319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,32,power_law_1.2,0.07385600209236146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,32,power_law_1.01,0.32330238819122314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,32,power_law_1.2,0.07479040026664734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,32,power_law_1.2,0.07747200131416321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,32,power_law_1.01,0.45357441902160645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,32,power_law_1.2,0.08071039915084839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,32,power_law_1.01,0.6266816139221192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,32,power_law_1.2,0.0869055986404419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,32,power_law_1.2,0.06884480118751526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,32,power_law_1.2,0.09273599982261657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,32,balanced,0.8403893311818441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,32,balanced,1.6362560590108235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,32,power_law_1.2,0.05875200033187866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,32,power_law_1.2,0.09556480050086975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,32,power_law_1.01,0.8881088256835937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,32,power_law_1.2,0.048147198557853696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,32,power_law_1.2,0.12339199781417846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,32,power_law_1.01,1.1513855934143067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,32,power_law_1.2,0.05440000295639038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,32,power_law_1.2,0.12753920555114745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,32,balanced,2.4389012654622397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,32,power_law_1.2,0.055820798873901366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,32,power_law_1.2,0.15599360466003417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,32,power_law_1.01,1.5436991691589355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,32,power_law_1.2,0.05544319748878479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,32,power_law_1.2,0.17141120433807372
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,32,power_law_1.2,0.058259201049804685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,32,power_law_1.01,2.2547264099121094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,32,power_law_1.2,0.24039039611816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,32,power_law_1.2,0.058924800157546996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,32,power_law_1.2,0.2558079957962036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,32,power_law_1.01,4.870284652709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,32,power_law_1.2,0.0595583975315094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,32,power_law_1.2,0.3745408058166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,32,power_law_1.2,0.06115840077400207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,32,power_law_1.2,0.4721856117248535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,32,power_law_1.2,0.0632960021495819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,32,power_law_1.2,0.6396607875823974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,32,power_law_1.2,0.06592000126838685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,32,balanced,1.297808011372884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,32,power_law_1.2,0.8129535675048828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,32,power_law_1.2,0.0686847984790802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,32,power_law_1.2,1.0429375648498536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,32,power_law_1.2,0.07111679911613464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,32,power_law_1.2,1.7296127319335937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,32,power_law_1.2,0.07971839904785157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,32,power_law_1.2,0.08409600257873535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,32,power_law_1.2,3.8352832794189453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,32,power_law_1.2,0.08945919871330262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,32,power_law_1.2,0.11672320365905761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,32,power_law_1.2,0.12362240552902222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,32,power_law_1.2,0.1575551986694336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,32,power_law_1.2,0.1733247995376587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,32,power_law_1.2,0.23494400978088378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,32,power_law_1.2,0.2761087894439697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,32,power_law_1.2,0.38943359851837156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,32,power_law_1.2,0.47136640548706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,32,power_law_1.2,0.7279615879058838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,32,power_law_1.2,0.9822976112365722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,32,power_law_1.2,1.2589119911193847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,32,power_law_1.2,2.113542366027832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,32,balanced,2.5773493448893228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,32,power_law_1.2,4.083161544799805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,32,power_law_1.2,0.05945600271224975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,32,power_law_1.2,0.05563520193099976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,32,power_law_1.2,0.04707199931144714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,32,power_law_1.2,0.05275520086288452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,32,power_law_1.2,0.054713600873947145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,32,power_law_1.2,0.05694720149040222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,32,power_law_1.2,0.05978239774703979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,32,power_law_1.2,0.06077439785003662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,32,power_law_1.2,0.0605184018611908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,16,balanced,0.05343999962011973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,32,power_law_1.2,0.06119040250778198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,16,balanced,0.05413866539796194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,32,power_law_1.2,0.06554239988327026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,16,balanced,0.054618666569391884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,16,balanced,0.05859733124574026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,32,power_law_1.2,0.06855040192604064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,16,balanced,0.07232533395290375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,32,power_law_1.2,0.07012479901313781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,16,balanced,0.07427200178305308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,32,power_law_1.2,0.07760639786720276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,16,balanced,0.07445333401362102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,32,power_law_1.2,0.08264960050582885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,16,balanced,0.07609066863854726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,32,power_law_1.2,0.08538240194320679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,16,balanced,0.07622933387756348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,16,balanced,0.07654933134714763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,32,power_law_1.2,0.09876480102539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,16,balanced,0.07769066592057546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,16,balanced,0.07866666714350383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,32,power_law_1.2,0.12213759422302246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,16,balanced,0.07902400195598602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,16,balanced,0.08066133161385854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,16,balanced,0.083514670530955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,32,power_law_1.2,0.13100160360336305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,16,balanced,0.08405866225560506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,16,balanced,0.08842133482297261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,32,power_law_1.2,0.17189760208129884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,16,balanced,0.09839466214179993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,32,power_law_1.2,0.2435136079788208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,16,balanced,0.1070240040620168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,16,balanced,0.12337066729863484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,32,power_law_1.2,0.2944000005722046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,16,balanced,0.04674666623274485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,16,balanced,0.13596266508102417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,32,power_law_1.2,0.4257535934448242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,16,balanced,0.04737600187460581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,16,balanced,0.04795200129350027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,16,balanced,0.16699733336766562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,32,power_law_1.2,0.5761087894439697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,16,balanced,0.05197333296140035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,16,balanced,0.05453333258628845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,32,power_law_1.2,0.696608018875122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,16,balanced,0.06329600016276042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,16,balanced,0.19106133778889975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,16,balanced,0.06443733473618825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,32,power_law_1.2,1.0344320297241212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,16,power_law_1.01,0.06332799792289734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,16,balanced,0.04429866870244344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,16,balanced,0.06551466882228851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,16,balanced,0.06595733265082042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,32,power_law_1.2,1.456486415863037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,16,balanced,0.24885332584381104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,16,power_law_1.01,0.07660800218582153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,16,balanced,0.04513066510359446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,16,balanced,0.06769066552321117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,16,balanced,0.046522667010625206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,16,power_law_1.01,0.06146559715270996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,16,balanced,0.06922133266925812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,32,power_law_1.2,2.2448448181152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,16,balanced,0.05147733290990194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,16,power_law_1.01,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,16,balanced,0.06982400019963582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,16,balanced,0.054527997970581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,16,balanced,0.07141333321730296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,16,power_law_1.01,0.07095680236816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,16,balanced,0.3123840093612671
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,32,power_law_1.2,3.2382270812988283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,16,power_law_1.01,0.052934402227401735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,16,balanced,0.0640533318122228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,16,balanced,0.0736053337653478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,16,power_law_1.01,0.06741759777069092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,16,balanced,0.0666240006685257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,32,power_law_1.2,7.4937278747558596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,16,balanced,0.07799466451009114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,16,power_law_1.01,0.06308479905128479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,16,power_law_1.01,0.07155839800834655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,16,balanced,0.06705600023269653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,16,balanced,0.07965866724650066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,16,power_law_1.01,0.07186560034751892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,16,power_law_1.01,0.052147197723388675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,16,balanced,0.06768533090750377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,16,power_law_1.01,0.07438079714775085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,16,balanced,0.08659733335177104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,16,power_law_1.01,0.05356159806251526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,16,balanced,0.06846933563550313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,16,balanced,0.42980265617370605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,16,power_law_1.01,0.07363200187683105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,16,power_law_1.01,0.05560960173606873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,16,balanced,0.09878399968147278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,16,balanced,0.07001066704591115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,16,power_law_1.01,0.057657599449157715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,16,power_law_1.01,0.074099200963974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,16,balanced,0.11043733358383179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,16,balanced,0.07180800040562947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,16,power_law_1.01,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,16,power_law_1.01,0.07662720084190369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,16,balanced,0.07382933298746745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,16,balanced,0.1311360001564026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,16,power_law_1.01,0.07973759770393371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,16,power_law_1.01,0.06305279731750488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,16,balanced,0.07455466687679291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,16,power_law_1.01,0.06354560256004334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,16,power_law_1.01,0.08275840282440186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,16,balanced,0.15027200182278952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,16,balanced,0.08170133332411449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,16,power_law_1.01,0.06549760103225707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,16,power_law_1.01,0.08797439932823181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,16,balanced,0.08422933022181193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,16,balanced,0.5524746576944987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,16,balanced,0.1901386578877767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,16,power_law_1.01,0.06516479849815368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,16,power_law_1.01,0.09445760250091553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,16,balanced,0.08828799923261006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,16,power_law_1.01,0.06849920153617858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,16,power_law_1.01,0.09459840059280396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,16,power_law_1.01,0.07134079933166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,16,power_law_1.01,0.11403520107269287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,16,balanced,0.2316533327102661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,16,balanced,0.10276800394058228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,16,power_law_1.01,0.0756928026676178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,16,power_law_1.01,0.11743359565734864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,16,power_law_1.01,0.08140799999237061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,16,power_law_1.01,0.14583679437637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,16,power_law_1.01,0.08873599767684937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,16,power_law_1.01,0.16858880519866942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,16,balanced,0.3183679978052775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,16,power_law_1.01,0.09160959720611572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,16,power_law_1.01,0.21431679725646974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,16,balanced,0.11868799726168315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,16,balanced,0.6871253649393717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,16,power_law_1.01,0.10917760133743286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,16,power_law_1.01,0.24606080055236818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,16,power_law_1.2,0.06835839748382569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,16,balanced,0.14275200168291727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,16,power_law_1.01,0.11930880546569825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,16,power_law_1.01,0.327622389793396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,16,power_law_1.2,0.07610880136489868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,16,power_law_1.01,0.15520000457763672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,16,balanced,0.40565331776936847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,16,power_law_1.01,0.45949440002441405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,16,balanced,0.15771200259526572
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,16,power_law_1.2,0.05514879822731018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,16,power_law_1.01,0.18446719646453857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,16,power_law_1.01,0.5835455894470215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,16,power_law_1.01,0.05791360139846802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,16,power_law_1.2,0.06309760212898255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,16,power_law_1.01,0.22338559627532958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,16,power_law_1.01,0.8380607604980469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,16,power_law_1.01,0.2661312103271484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,16,power_law_1.2,0.07180160284042358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,16,power_law_1.01,0.0658623993396759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,16,balanced,0.21760533253351846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,16,power_law_1.01,0.9428544044494629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,16,power_law_1.01,0.3884416103363037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,16,power_law_1.2,0.06656640172004699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,16,power_law_1.01,0.05137919783592224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,16,power_law_1.2,0.07204480171203613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,16,power_law_1.01,0.4901120185852051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,16,power_law_1.01,0.055257600545883176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,16,balanced,0.5777706702550253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,16,power_law_1.01,1.4485631942749024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,16,power_law_1.2,0.07212160229682922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,16,balanced,0.26892266670862836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,16,power_law_1.01,0.7000832080841064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,16,power_law_1.01,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,16,power_law_1.01,2.7900928497314452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,16,power_law_1.2,0.07330560088157653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,16,power_law_1.01,0.9099648475646973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,16,power_law_1.01,0.06026880145072937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,16,power_law_1.2,0.07359359860420227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,16,power_law_1.01,0.06517120003700257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,16,power_law_1.01,1.1786304473876954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,16,balanced,1.0352213382720947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,16,power_law_1.2,0.07637119889259339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,16,power_law_1.01,0.06749439835548401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,16,power_law_1.01,1.8011135101318358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,16,power_law_1.2,0.07928959727287292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,16,balanced,0.40172266960144043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,16,power_law_1.01,0.06800640225410462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,16,power_law_1.01,3.4926078796386717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,16,power_law_1.2,0.07964800000190735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,16,balanced,0.7375893592834473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,16,power_law_1.01,0.06851840019226074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,16,power_law_1.2,0.08436480164527893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,16,power_law_1.01,0.06959999799728393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,16,power_law_1.2,0.08856959939002991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,16,power_law_1.01,0.0769536018371582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,16,balanced,0.4989866813023885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,16,power_law_1.2,0.09555839896202087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,16,power_law_1.01,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,16,power_law_1.2,0.09848960041999817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,16,power_law_1.01,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,16,power_law_1.2,0.11411199569702149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,16,power_law_1.01,0.09400960206985473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,16,power_law_1.2,0.1238144040107727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,16,power_law_1.01,0.0974016010761261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,16,balanced,0.716970682144165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,16,balanced,0.9221866925557455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,16,power_law_1.2,0.14746240377426148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,16,power_law_1.01,0.10575360059738159
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,16,power_law_1.2,0.18186880350112916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,16,power_law_1.01,0.12821760177612304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,16,power_law_1.2,0.22221438884735106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,16,power_law_1.2,0.2740544080734253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,16,power_law_1.2,0.39229440689086914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,16,power_law_1.01,0.14561920166015624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,16,power_law_1.2,0.46450557708740237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,16,power_law_1.01,0.19207040071487427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,16,balanced,0.9320000012715658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,16,power_law_1.2,0.6534976005554199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,16,power_law_1.01,0.2550015926361084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,16,power_law_1.2,0.9271488189697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,16,power_law_1.01,0.3084991931915283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,16,power_law_1.2,1.2216511726379395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,16,power_law_1.01,0.41787519454956057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,16,power_law_1.2,1.8390207290649414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,16,power_law_1.01,0.6309823989868164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,16,balanced,1.9776959419250488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,16,power_law_1.2,3.8403839111328124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,16,balanced,1.4201919237772624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,16,power_law_1.01,0.7415167808532714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,16,power_law_1.01,1.0619520187377929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,16,power_law_1.01,1.4321344375610352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,16,balanced,1.1638240019480388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,16,power_law_1.01,1.656083106994629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,16,power_law_1.01,3.0426559448242188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,16,power_law_1.01,6.397900772094727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,16,balanced,1.8113706906636555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,16,power_law_1.2,0.0527616024017334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,16,power_law_1.2,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,16,power_law_1.2,0.04842239916324616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,16,power_law_1.2,0.05320320129394531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,16,power_law_1.2,0.05560960173606873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,16,balanced,2.7735093434651694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,16,power_law_1.2,0.05910400152206421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,16,power_law_1.2,0.06102399826049805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,16,power_law_1.2,0.0624064028263092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,16,power_law_1.2,0.06386560201644897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,16,power_law_1.2,0.06538879871368408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,16,power_law_1.2,0.06691200137138367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,16,power_law_1.2,0.06911360025405884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,16,power_law_1.2,0.07286400198936463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,16,power_law_1.2,0.07722240090370178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,16,power_law_1.2,0.08428159952163697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,16,power_law_1.2,0.09070720076560974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,16,power_law_1.2,0.09364479780197144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,16,power_law_1.2,0.11115520000457764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,16,power_law_1.2,0.13048319816589354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,16,balanced,3.602229436238607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,16,power_law_1.2,0.16268160343170165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,16,power_law_1.2,0.1854464054107666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,16,power_law_1.2,0.2364799976348877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,16,power_law_1.2,0.30436480045318604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,16,power_law_1.2,0.40839037895202634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,16,power_law_1.2,0.5707583904266358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,8,balanced,0.05499200026194254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,16,power_law_1.2,0.7965760231018066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,8,balanced,0.05421333511670431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,16,power_law_1.2,1.1233280181884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,8,balanced,0.05585066477457682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,16,power_law_1.2,0.05783680081367493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,8,balanced,0.060271998246510826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,16,power_law_1.2,1.3072896003723145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,8,balanced,0.0774186650911967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,16,power_law_1.2,0.0636352002620697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,8,balanced,0.09086400270462036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,16,power_law_1.2,2.1916223526000977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,16,power_law_1.2,0.04892799854278564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,8,balanced,0.09011733531951904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,16,power_law_1.2,0.05173119902610779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,8,balanced,0.09268800417582194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,16,power_law_1.2,4.338227081298828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,8,balanced,0.09237866600354512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,16,power_law_1.2,0.055795198678970336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,8,balanced,0.09386666615804036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,16,power_law_1.2,0.06106240153312683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,8,balanced,0.09056533376375835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,16,power_law_1.2,0.06613119840621948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,8,balanced,0.09274133046468098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,16,power_law_1.2,0.06651520133018493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,8,balanced,0.09390399853388469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,16,power_law_1.2,0.06796799898147583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,8,balanced,0.09491200248400371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,16,power_law_1.2,0.06971520185470581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,8,balanced,0.10317867000897725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,16,power_law_1.2,0.07221760153770447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,8,balanced,0.10046399633089702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,16,power_law_1.2,0.07621759772300721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,16,power_law_1.2,0.07880319952964783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,8,balanced,0.10547199845314026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,16,power_law_1.2,0.08521599769592285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,8,balanced,0.11076266566912334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,16,power_law_1.2,0.09219840168952942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,8,balanced,0.12288533647855122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,8,balanced,0.04740266501903534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,16,power_law_1.2,0.09644160270690919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,8,balanced,0.048021331429481506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,8,balanced,0.1402079959710439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,16,power_law_1.2,0.12057600021362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,8,balanced,0.04934399823347727
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,8,balanced,0.055125330885251365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,8,balanced,0.06705066561698914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,8,balanced,0.15788267056147257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,16,power_law_1.2,0.13982080221176146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,8,balanced,0.07941333452860515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,8,balanced,0.0795360008875529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,8,balanced,0.1962826649347941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,8,balanced,0.07906666894753774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,16,power_law_1.2,0.15217920541763305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,8,balanced,0.07944533228874207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,16,power_law_1.2,0.20653440952301025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,8,balanced,0.08037866652011871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,8,balanced,0.08290133376916249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,16,power_law_1.2,0.25360000133514404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,8,balanced,0.239029328028361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,8,balanced,0.08360000451405843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,8,balanced,0.08498133222262065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,16,power_law_1.2,0.36784000396728517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,8,balanced,0.08686932921409607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,16,power_law_1.2,0.47253122329711916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,8,balanced,0.09330667058626811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,8,balanced,0.32445865869522095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,8,balanced,0.09630933403968811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,8,balanced,0.10100799798965454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,16,power_law_1.2,0.7577983856201171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,8,balanced,0.1143946647644043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,16,power_law_1.2,0.8830400466918945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,8,balanced,0.12803199887275696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,16,power_law_1.2,1.532761573791504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,8,power_law_1.01,0.058483201265335086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,8,balanced,0.41813866297403973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,8,balanced,0.15037866433461508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,16,power_law_1.2,1.6793920516967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,8,power_law_1.01,0.06239359974861145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,8,balanced,0.1753973364830017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,8,power_law_1.01,0.055212801694869994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,16,power_law_1.2,2.174163246154785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,8,power_law_1.01,0.061408001184463504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,8,balanced,0.2241386572519938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,8,power_law_1.01,0.06785280108451844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,16,power_law_1.2,3.344441604614258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,8,power_law_1.01,0.07411199808120728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,8,balanced,0.5937920014063517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,8,power_law_1.01,0.08952959775924682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,8,balanced,0.2824959953625997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,16,power_law_1.2,7.640249633789063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,8,power_law_1.01,0.07966079711914062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,8,power_law_1.01,0.0795199990272522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,8,balanced,0.3903306722640991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,8,power_law_1.01,0.08341119885444641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,8,power_law_1.01,0.09583359956741333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,8,power_law_1.01,0.10038399696350098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,8,power_law_1.01,0.09886720180511474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,8,balanced,0.7327786286671957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,8,balanced,0.5021440188090006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,8,power_law_1.01,0.10104960203170776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,8,power_law_1.01,0.05321599841117859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,8,power_law_1.01,0.11228799819946289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,8,power_law_1.01,0.056531202793121335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,8,power_law_1.01,0.11271040439605713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,8,power_law_1.01,0.10654720067977905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,8,power_law_1.01,0.052716797590255736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,8,balanced,0.729973316192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,8,power_law_1.01,0.12676479816436767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,8,power_law_1.01,0.05608320236206055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,8,power_law_1.01,0.13224320411682128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,8,power_law_1.01,0.06188160181045532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,8,power_law_1.01,0.17623039484024047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,8,power_law_1.01,0.0654528021812439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,8,balanced,0.940778652826945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,8,power_law_1.01,0.07400959730148315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,8,power_law_1.01,0.1739456057548523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,8,power_law_1.01,0.2526144027709961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,8,power_law_1.01,0.07279999852180481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,8,power_law_1.01,0.07504640221595764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,8,power_law_1.01,0.29030399322509765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,8,balanced,0.9156213601430258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,8,power_law_1.01,0.0759872019290924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,8,power_law_1.01,0.40589442253112795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,8,power_law_1.01,0.07863680124282837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,8,power_law_1.01,0.4916224002838135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,8,power_law_1.01,0.08195199966430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,8,power_law_1.01,0.7715583801269531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,8,power_law_1.01,0.08823040127754211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,8,power_law_1.01,0.9729023933410644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,8,power_law_1.01,0.09410560131072998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,8,power_law_1.01,1.146828842163086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,8,power_law_1.01,0.102566397190094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,8,power_law_1.01,1.896294403076172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,8,power_law_1.01,0.1102463960647583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,8,power_law_1.01,0.106387197971344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,8,power_law_1.01,3.6810367584228514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,8,balanced,1.1664160092671711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,8,power_law_1.01,0.12378879785537719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,8,balanced,1.3872747421264648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,8,power_law_1.01,0.14085760116577148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,8,power_law_1.01,0.17423360347747802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,8,power_law_1.01,0.19994239807128905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,8,power_law_1.01,0.27375359535217286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,8,power_law_1.01,0.3243072032928467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,8,power_law_1.01,0.44181118011474607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,8,power_law_1.01,0.604582405090332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,8,power_law_1.01,0.8840895652770996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,8,power_law_1.01,1.1179648399353028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,8,power_law_1.01,1.407091236114502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,8,balanced,1.769290606180827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,8,power_law_1.01,2.170822334289551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,8,power_law_1.01,4.251481628417968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,8,power_law_1.2,0.060864001512527466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,8,power_law_1.2,0.06087679862976074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,8,power_law_1.2,0.055283200740814206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,8,power_law_1.2,0.06218240261077881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,8,power_law_1.2,0.06922879815101624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,8,power_law_1.2,0.0689408004283905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,8,power_law_1.2,0.08229759931564332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,8,power_law_1.2,0.08505600094795226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,8,power_law_1.2,0.08426880240440368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,8,power_law_1.2,0.08751999735832214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,8,balanced,2.6808961232503257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,8,power_law_1.2,0.09692800045013428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,8,power_law_1.2,0.09968640208244324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,8,power_law_1.2,0.10218240022659301
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,8,power_law_1.2,0.10324480533599853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,8,power_law_1.2,0.11626880168914795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,8,power_law_1.2,0.11967359781265259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,8,power_law_1.2,0.10933120250701904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,8,power_law_1.2,0.13007359504699706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,8,power_law_1.2,0.14563839435577391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,8,power_law_1.2,0.18143359422683716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,8,power_law_1.2,0.1863487958908081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,8,balanced,3.508319854736328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,8,power_law_1.2,0.27948799133300783
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,8,power_law_1.2,0.31848959922790526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,8,power_law_1.2,0.44060797691345216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,8,power_law_1.2,0.5757247924804687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,8,power_law_1.2,0.8217023849487305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,8,power_law_1.2,1.2027775764465332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,8,power_law_1.2,1.3884544372558594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,8,power_law_1.2,0.0531328022480011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,8,power_law_1.2,2.193062400817871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,8,power_law_1.2,0.05549439787864685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,8,power_law_1.2,4.270316696166992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,8,power_law_1.2,0.05021439790725708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,8,power_law_1.2,0.0541375994682312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,8,power_law_1.2,0.05985280275344849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,8,power_law_1.2,0.06170880198478699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,8,power_law_1.2,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,8,power_law_1.2,0.07322239875793457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,8,power_law_1.2,0.07493759989738465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,8,power_law_1.2,0.07377279996871948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,8,power_law_1.2,0.08007680177688599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,8,power_law_1.2,0.0841152012348175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,8,power_law_1.2,0.08715519905090333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,8,power_law_1.2,0.09452800154685974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,8,power_law_1.2,0.10194560289382934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,8,power_law_1.2,0.11168639659881592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,8,power_law_1.2,0.11007360219955445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,8,power_law_1.2,0.1312064051628113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,8,power_law_1.2,0.14333440065383912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,8,power_law_1.2,0.17813119888305665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,8,power_law_1.2,0.20974719524383545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,8,power_law_1.2,0.2872512102127075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,8,power_law_1.2,0.35155200958251953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,8,power_law_1.2,0.5267583847045898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,128,balanced,0.03417066733042399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,8,power_law_1.2,0.6299200057983398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,8,power_law_1.2,0.9147456169128418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,128,balanced,0.03475199888149897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,128,balanced,0.03453866640726725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,8,power_law_1.2,1.2957504272460938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,128,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,128,balanced,0.03705599904060364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,8,power_law_1.2,1.510655975341797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,128,balanced,0.037871999045213066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,8,power_law_1.2,2.6191104888916015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,128,balanced,0.036517334481080375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,128,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,8,power_law_1.2,5.1204673767089846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,128,balanced,0.03806933263937632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,128,balanced,0.038378665844599404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,128,balanced,0.03919466584920883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,128,balanced,0.03760000069936117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,128,balanced,0.03788266579310099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,128,balanced,0.03266666581233343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,128,balanced,0.0378560001651446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,128,balanced,0.033376000821590424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,128,balanced,0.041749333341916404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,128,balanced,0.032602667808532715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,128,balanced,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,128,balanced,0.03437866767247518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,128,balanced,0.03975466638803482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,128,balanced,0.03521066655715307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,128,balanced,0.03623999903599421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,128,balanced,0.04041066765785217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,128,balanced,0.03783999880154928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,128,balanced,0.042021334171295166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,128,balanced,0.0371573343873024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,128,balanced,0.035317334036032356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,128,balanced,0.042447999119758606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,128,balanced,0.03827200084924698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,128,balanced,0.036517334481080375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,128,balanced,0.043061330914497375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,128,balanced,0.036303999523321785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,128,balanced,0.023242667317390442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,128,balanced,0.0377866675456365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,128,balanced,0.05053333441416422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,128,balanced,0.02293333411216736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,128,balanced,0.03955733279387156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,128,balanced,0.023168000082174938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,128,balanced,0.0403413325548172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,128,balanced,0.02422400067249934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,128,power_law_1.01,0.03265919983386993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,128,balanced,0.05217066903909048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,128,balanced,0.03982933362325033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,128,balanced,0.02533866713444392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,128,power_law_1.01,0.032902398705482484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,128,balanced,0.026341333985328674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,128,balanced,0.04146133363246918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,128,power_law_1.01,0.03391999900341034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,128,balanced,0.026352000733216602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,128,balanced,0.04298666616280874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,128,balanced,0.026250667870044708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,128,power_law_1.01,0.0349375993013382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,128,balanced,0.06914666791756947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,128,balanced,0.026394667724768322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,128,balanced,0.04322666426499685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,128,power_law_1.01,0.03540480136871338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,128,balanced,0.027119999130566914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,128,balanced,0.04595733185609182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,128,balanced,0.02731200059254964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,128,power_law_1.01,0.03685120046138764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,128,power_law_1.01,0.030956798791885377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,128,balanced,0.027850667635599773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,128,power_law_1.01,0.036320000886917114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,128,balanced,0.04855999847253164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,128,balanced,0.028688001135985058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,128,balanced,0.0775679995616277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,128,power_law_1.01,0.03073279857635498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,128,power_law_1.01,0.0371071994304657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,128,balanced,0.028789333999156952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,128,power_law_1.01,0.03049600124359131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,128,power_law_1.01,0.035148799419403076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,128,balanced,0.06285866598288219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,128,balanced,0.03123733401298523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,128,power_law_1.01,0.03244799971580505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,128,power_law_1.01,0.03511039912700653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,128,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,128,power_law_1.01,0.033344000577926636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,128,power_law_1.01,0.03528960049152374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,128,balanced,0.07176533341407776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,128,power_law_1.01,0.034355199337005614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,128,power_law_1.01,0.03589119911193848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,128,power_law_1.01,0.036262398958206175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,128,balanced,0.1042133371035258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,128,power_law_1.01,0.03521920144557953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,128,power_law_1.01,0.03638400137424469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,128,balanced,0.03149333347876867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,128,power_law_1.01,0.03534719944000244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,128,balanced,0.09455999732017517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,128,power_law_1.01,0.03477759957313538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,128,power_law_1.01,0.0367935985326767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,128,balanced,0.03312533348798752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,128,power_law_1.01,0.036601600050926206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,128,power_law_1.01,0.04206080138683319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,128,balanced,0.032501332461833954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,128,power_law_1.01,0.03594880104064942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,128,power_law_1.01,0.0406464010477066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,128,power_law_1.01,0.035622400045394895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,128,power_law_1.01,0.0463808000087738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,128,balanced,0.11157866319020589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,128,power_law_1.01,0.03596160113811493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,128,power_law_1.01,0.05057280063629151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,128,balanced,0.12010666728019714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,128,power_law_1.01,0.03619199991226196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,128,power_law_1.01,0.06346880197525025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,128,balanced,0.03674133370320002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,128,power_law_1.01,0.03774079978466034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,128,power_law_1.01,0.07132800221443177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,128,balanced,0.03721600025892258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,128,power_law_1.01,0.03896960020065308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,128,power_law_1.01,0.09037439823150635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,128,power_law_1.01,0.04154239892959595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,128,power_law_1.01,0.11594239473342896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,128,power_law_1.01,0.02162559926509857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,128,balanced,0.14868266383806863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,128,power_law_1.01,0.15889279842376708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,128,power_law_1.01,0.046854400634765626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,128,power_law_1.01,0.02160000056028366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,128,power_law_1.01,0.04880639910697937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,128,balanced,0.042863999803860985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,128,power_law_1.01,0.2042367935180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,128,power_law_1.01,0.02167679965496063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,128,power_law_1.01,0.05859839916229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,128,power_law_1.01,0.27871360778808596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,128,power_law_1.01,0.02364159971475601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,128,power_law_1.01,0.07118719816207886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,128,balanced,0.04717333118120829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,128,power_law_1.01,0.37718400955200193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,128,balanced,0.1453439990679423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,128,power_law_1.01,0.023974399268627166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,128,power_law_1.01,0.09354879856109619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,128,power_law_1.01,0.4936255931854248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,128,power_law_1.01,0.024883200228214265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,128,power_law_1.01,0.1124735951423645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,128,power_law_1.01,0.7931583881378174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,128,power_law_1.01,0.02503040134906769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,128,power_law_1.01,0.1802240014076233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,128,balanced,0.18337599436442056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,128,power_law_1.01,0.025670400261878966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,128,power_law_1.01,0.2060159921646118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,128,power_law_1.01,1.6470912933349608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,128,power_law_1.01,0.025497600436210632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,128,power_law_1.01,0.2876607894897461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,128,power_law_1.01,0.025830399990081788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,128,balanced,0.05824000140031179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,128,power_law_1.01,0.4111231803894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,128,power_law_1.01,0.026707199215888978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,128,power_law_1.01,0.5259647846221924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,128,power_law_1.01,0.026694399118423463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,128,power_law_1.01,0.027481600642204285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,128,power_law_1.01,0.8556735992431641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,128,power_law_1.01,0.028505599498748778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,2,128,power_law_1.2,0.034092798829078674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,128,power_law_1.01,1.6697599411010742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,128,balanced,0.06814399858315785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,128,power_law_1.01,0.030726400017738343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,128,balanced,0.21958933273951212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,2,128,power_law_1.2,0.033990401029586795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,128,power_law_1.01,0.032390400767326355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,2,128,power_law_1.2,0.03446399867534637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,128,balanced,0.2134666641553243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,2,128,power_law_1.2,0.03576320111751556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,2,128,power_law_1.2,0.03601920008659363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,2,128,power_law_1.2,0.03731200098991394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,128,power_law_1.01,0.037088000774383546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,2,128,power_law_1.2,0.03681280016899109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,128,power_law_1.01,0.044863998889923096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,2,128,power_law_1.2,0.03705599904060364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,2,128,power_law_1.2,0.036985599994659425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,128,power_law_1.01,0.04756479859352112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,2,128,power_law_1.2,0.03877759873867035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,2,128,power_law_1.2,0.036025598645210266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,2,128,power_law_1.2,0.03580799996852875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,128,balanced,0.09040000041325887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,2,128,power_law_1.2,0.037561601400375365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,128,power_law_1.01,0.0572160005569458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,2,128,power_law_1.2,0.03800959885120392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,128,power_law_1.01,0.0648576021194458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,2,128,power_law_1.2,0.04385280013084412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,128,power_law_1.2,0.03076480031013489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,2,128,power_law_1.2,0.04015359878540039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,128,power_law_1.01,0.07842559814453125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,2,128,power_law_1.2,0.04379520118236542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,128,power_law_1.2,0.030713599920272828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,2,128,power_law_1.2,0.055289602279663085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,128,power_law_1.01,0.10679039955139161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,128,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,128,balanced,0.32849599917729694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,128,power_law_1.2,0.05868160128593445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,128,power_law_1.2,0.032678401470184325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,128,power_law_1.2,0.07023360133171082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,128,power_law_1.2,0.03333759903907776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,128,power_law_1.2,0.09290239810943604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,128,power_law_1.01,0.13026560544967652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,128,power_law_1.2,0.12784639596939087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,128,power_law_1.2,0.03410559892654419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,128,power_law_1.2,0.16972800493240356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,128,power_law_1.2,0.03592320084571839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,128,power_law_1.2,0.22254080772399903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,128,power_law_1.01,0.19485440254211425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,128,balanced,0.10915199915568034
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,128,power_law_1.2,0.03594880104064942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,128,power_law_1.2,0.32799999713897704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,128,power_law_1.2,0.0348800003528595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,128,power_law_1.2,0.47342720031738283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,128,power_law_1.2,0.03562879860401154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,128,power_law_1.2,0.6055552005767822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,128,power_law_1.01,0.25016961097717283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,128,power_law_1.2,0.03632639944553375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,128,power_law_1.2,0.74966402053833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,128,power_law_1.2,0.0354559987783432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,128,power_law_1.2,1.1875519752502441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,128,power_law_1.2,0.03607040047645569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,128,power_law_1.01,0.3484992027282715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,128,power_law_1.2,2.389331245422363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,128,power_law_1.2,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,128,power_law_1.2,0.04188799858093262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,128,power_law_1.2,0.04035199880599975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,128,power_law_1.2,0.04123519957065582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,128,power_law_1.2,0.04842239916324616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,128,balanced,0.39339733123779297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,128,power_law_1.01,0.3692095994949341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,128,balanced,0.12924266854921976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,128,power_law_1.2,0.054655998945236206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,128,power_law_1.01,0.6834559917449952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,128,power_law_1.2,0.07083520293235779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,128,power_law_1.2,0.08869119882583618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,128,power_law_1.01,1.3476927757263184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,128,power_law_1.2,0.12072319984436035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,128,power_law_1.2,0.15119999647140503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,128,power_law_1.2,0.21815040111541747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,128,power_law_1.2,0.2636607885360718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,128,power_law_1.2,0.4070720195770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,128,power_law_1.2,0.5685440063476562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,128,balanced,0.6194506486256918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,128,power_law_1.2,0.7015232086181641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,128,balanced,0.18936532735824585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,128,power_law_1.2,1.1018112182617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,128,power_law_1.2,2.1633344650268556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,128,balanced,0.35312533378601074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,128,power_law_1.2,0.021568000316619873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,128,power_law_1.2,0.021881599724292756
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,128,power_law_1.2,0.021932800114154816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,64,balanced,0.021754667162895203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,128,power_law_1.2,0.02361599951982498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,128,power_law_1.2,0.02420479953289032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,64,balanced,0.023738667368888855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,128,power_law_1.2,0.024908800423145295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,64,balanced,0.02164799968401591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,64,balanced,0.023045333723227184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,128,power_law_1.2,0.025312000513076784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,64,balanced,0.023445333043734234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,128,power_law_1.2,0.025856000185012818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,64,balanced,0.024832000335057575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,128,power_law_1.2,0.025696000456809996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,64,balanced,0.02532800038655599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,128,power_law_1.2,0.026073598861694337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,64,balanced,0.025055999557177227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,128,power_law_1.2,0.026867198944091796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,64,balanced,0.02455466737349828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,128,power_law_1.2,0.027167999744415285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,64,balanced,0.025008000433444977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,64,balanced,0.025786665578683216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,128,power_law_1.2,0.027910399436950683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,64,balanced,0.026202666262785595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,128,power_law_1.2,0.029388800263404846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,64,balanced,0.02665599932273229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,128,power_law_1.2,0.032927998900413515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,64,balanced,0.033285332222779594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,128,power_law_1.2,0.0328000009059906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,64,balanced,0.03488533447186152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,64,balanced,0.03487999985615412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,128,power_law_1.2,0.04095360040664673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,64,balanced,0.03568000098069509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,128,power_law_1.2,0.05107839703559876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,64,balanced,0.03708266715208689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,128,power_law_1.2,0.05798400044441223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,64,balanced,0.03787733366092046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,64,balanced,0.030245333909988403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,128,power_law_1.2,0.07138559818267823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,64,balanced,0.03985599925120672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,64,balanced,0.028592000404993694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,128,power_law_1.2,0.09224960207939148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,64,balanced,0.028618666032950085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,64,balanced,0.04058666775623957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,64,balanced,0.03070399910211563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,128,power_law_1.2,0.12010879516601562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,64,balanced,0.03257599969704946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,64,balanced,0.04284266630808512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,128,power_law_1.2,0.14935679435729982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,64,balanced,0.03332799921433131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,64,balanced,0.03275733441114426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,64,balanced,0.033045334120591484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,64,balanced,0.04603200157483419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,64,balanced,0.033146666983763375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,128,power_law_1.2,0.20905599594116211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,64,balanced,0.03369600077470144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,64,balanced,0.034160000582536064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,128,power_law_1.2,0.2961280107498169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,64,balanced,0.034373333056767784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,64,balanced,0.05726400017738342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,64,power_law_1.01,0.02160640060901642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,64,balanced,0.0349386657277743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,64,balanced,0.03548266738653183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,64,power_law_1.01,0.023097600042819976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,128,power_law_1.2,0.4026303768157959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,64,balanced,0.03826133410135905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,64,power_law_1.01,0.021196800470352172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,64,balanced,0.0377866675456365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,64,power_law_1.01,0.022592000663280487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,128,power_law_1.2,0.5148416042327881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,64,balanced,0.05909333129723867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,64,balanced,0.022085333863894146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,64,balanced,0.0390133336186409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,64,power_law_1.01,0.023296000063419343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,64,balanced,0.022143999735514324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,64,power_law_1.01,0.024057599902153014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,64,balanced,0.03957333415746689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,64,balanced,0.022154666483402252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,128,power_law_1.2,0.6223040103912354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,64,power_law_1.01,0.02447360008955002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,64,balanced,0.040634666879971824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,64,balanced,0.023381332556406658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,64,power_law_1.01,0.025433599948883057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,128,power_law_1.2,0.9459327697753906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,64,balanced,0.024864000578721363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,64,power_law_1.01,0.028230398893356323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,64,balanced,0.042992000778516136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,64,balanced,0.0775679995616277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,64,balanced,0.025807999074459076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,128,power_law_1.2,1.941472053527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,64,power_law_1.01,0.02961919903755188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,64,balanced,0.025989333788553875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,64,balanced,0.04558399816354116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,64,balanced,0.025914666553338368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,64,power_law_1.01,0.031193599104881287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,64,balanced,0.02609066665172577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,64,power_law_1.01,0.03157120048999786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,64,balanced,0.055439998706181846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,64,balanced,0.02672533442576726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,64,power_law_1.01,0.031718400120735166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,64,power_law_1.01,0.03056640028953552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,64,balanced,0.027215999861558277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,64,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,64,balanced,0.027221334477265675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,64,power_law_1.01,0.028934401273727418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,64,balanced,0.06488533318042755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,64,power_law_1.01,0.0349375993013382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,64,balanced,0.07986666758855183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,64,power_law_1.01,0.02905600070953369
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,64,balanced,0.028016000986099243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,64,power_law_1.01,0.031020799279212953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,64,power_law_1.01,0.03619840145111084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,64,power_law_1.01,0.03163520097732544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,64,balanced,0.028378665447235107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,64,power_law_1.01,0.022124800086021423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,64,power_law_1.01,0.03726719915866852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,64,power_law_1.01,0.03277440071105957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,64,balanced,0.08482666810353597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,64,balanced,0.030453334252039593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,64,power_law_1.01,0.032313600182533264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,64,power_law_1.01,0.039340800046920775
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,64,power_law_1.01,0.0216511994600296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,64,power_law_1.01,0.03293440043926239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,64,balanced,0.030106666187445324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,64,power_law_1.01,0.03313280045986176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,64,power_law_1.01,0.02202879935503006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,64,power_law_1.01,0.04420480132102966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,64,power_law_1.01,0.033241599798202515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,64,power_law_1.01,0.02398719936609268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,64,power_law_1.01,0.048179200291633605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,64,power_law_1.01,0.034016001224517825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,64,power_law_1.01,0.024383999407291412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,64,power_law_1.01,0.034668800234794614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,64,power_law_1.01,0.06149119734764099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,64,balanced,0.0969546635945638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,64,power_law_1.01,0.034771201014518735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,64,power_law_1.01,0.025363200902938844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,64,power_law_1.01,0.07006719708442688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,64,power_law_1.01,0.03640320003032684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,64,balanced,0.031343999008337654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,64,balanced,0.09248532851537068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,64,power_law_1.01,0.025676798820495606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,64,power_law_1.01,0.03893760144710541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,64,power_law_1.01,0.08296959996223449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,64,power_law_1.01,0.03994880020618439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,64,balanced,0.03363200028737386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,64,power_law_1.01,0.026118400692939758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,64,power_law_1.01,0.04163840115070343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,64,power_law_1.01,0.10981119871139526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,64,power_law_1.01,0.026208001375198364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,64,power_law_1.01,0.04695680141448975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,64,balanced,0.03270400067170461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,64,power_law_1.01,0.1175104022026062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,64,power_law_1.01,0.0462336003780365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,64,power_law_1.01,0.026348799467086792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,64,power_law_1.01,0.05246719717979431
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,64,balanced,0.1273973286151886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,64,power_law_1.01,0.027001601457595826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,64,power_law_1.01,0.15567359924316407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,64,power_law_1.01,0.06261759996414185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,64,power_law_1.01,0.02768000066280365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,64,power_law_1.01,0.077811199426651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,64,power_law_1.01,0.1797760009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,64,power_law_1.01,0.09165440201759338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,64,power_law_1.01,0.028204798698425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,64,balanced,0.03712533414363861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,64,power_law_1.01,0.22537600994110107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,64,power_law_1.01,0.13200639486312865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,64,power_law_1.01,0.030022400617599487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,64,power_law_1.01,0.13999359607696532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,64,power_law_1.01,0.2996543884277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,64,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,64,balanced,0.038346665600935616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,64,power_law_1.01,0.21653759479522705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,2048,768,8,128,4,64,power_law_1.2,0.021542400121688843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,64,power_law_1.01,0.03324800133705139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,64,power_law_1.01,0.2783744096755981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,64,power_law_1.01,0.6440063953399658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,2048,768,8,128,4,64,power_law_1.2,0.022988800704479218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,64,power_law_1.01,0.31727359294891355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,64,balanced,0.15228266517321268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,2048,768,8,128,4,64,power_law_1.2,0.021196800470352172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,64,balanced,0.04509866734345754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,64,power_law_1.01,0.03619840145111084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,2048,768,8,128,4,64,power_law_1.2,0.022540800273418427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,64,power_law_1.01,0.4997375965118408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,64,balanced,0.12482133507728577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,2048,768,8,128,4,64,power_law_1.2,0.02316800057888031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,64,power_law_1.01,0.0436928004026413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,64,power_law_1.01,1.0438528060913086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,2048,768,8,128,4,64,power_law_1.2,0.024172799289226533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,64,power_law_1.01,0.04677119851112366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,64,balanced,0.04972266654173533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,2048,768,8,128,4,64,power_law_1.2,0.02418559938669205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,2048,768,8,128,4,64,power_law_1.2,0.026144000887870788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,2048,768,8,128,4,64,power_law_1.2,0.029452800750732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,64,power_law_1.01,0.05451520085334778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,2048,768,8,128,4,64,power_law_1.2,0.03047040104866028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,64,power_law_1.01,0.06540799736976624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,2048,768,8,128,4,64,power_law_1.2,0.031167998909950256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,64,balanced,0.17877866824467978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,2048,768,8,128,4,64,power_law_1.2,0.031302401423454286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,64,power_law_1.01,0.08370559811592101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,2048,768,8,128,4,64,power_law_1.2,0.032051199674606325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,64,balanced,0.0637600024541219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,64,power_law_1.01,0.10243840217590332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,2048,768,8,128,4,64,power_law_1.2,0.034092798829078674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,2048,768,8,128,4,64,power_law_1.2,0.03580799996852875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,2048,768,8,128,4,64,power_law_1.2,0.03632639944553375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,64,power_law_1.01,0.12854399681091308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,2048,768,8,128,4,64,power_law_1.2,0.03752320110797882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,64,balanced,0.07575466732184093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,64,power_law_1.01,0.17926399707794188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,2048,768,8,128,4,64,power_law_1.2,0.041254401206970215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,64,power_law_1.2,0.046214398741722104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,64,power_law_1.2,0.05691519975662231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,64,power_law_1.2,0.06220160126686096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,64,power_law_1.01,0.2613823890686035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,64,power_law_1.2,0.09580159783363343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,64,power_law_1.2,0.0986303985118866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,64,power_law_1.2,0.15727360248565675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,64,power_law_1.2,0.15914880037307738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,64,power_law_1.01,0.31934080123901365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,64,balanced,0.10136533776919048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,64,power_law_1.2,0.2759040117263794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,64,balanced,0.2622879942258199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,64,power_law_1.2,0.3211456060409546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,64,power_law_1.2,0.3393856048583984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,64,power_law_1.2,0.5873216152191162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,64,power_law_1.2,1.3017279624938964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,64,power_law_1.01,0.4061439990997314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,64,power_law_1.01,0.6301951885223389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,64,balanced,0.21416000525156656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,64,power_law_1.01,1.329599952697754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,64,balanced,0.1251520017782847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,64,balanced,0.14903466900189719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,64,balanced,0.48259198665618896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,64,power_law_1.2,0.030649599432945252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,64,power_law_1.2,0.02928000092506409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,64,balanced,0.22061334053675333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,64,power_law_1.2,0.02844800055027008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,64,power_law_1.2,0.031027200818061828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,64,power_law_1.2,0.03162879943847656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,64,power_law_1.2,0.032678401470184325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,64,power_law_1.2,0.03238399922847748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,64,power_law_1.2,0.03268480002880096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,64,power_law_1.2,0.03404799997806549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,64,power_law_1.2,0.03301759958267212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,64,power_law_1.2,0.033983999490737916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,64,power_law_1.2,0.03463680148124695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,64,power_law_1.2,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,64,power_law_1.2,0.036473599076271054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,64,power_law_1.2,0.03912320137023926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,64,power_law_1.2,0.04044800102710724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,64,power_law_1.2,0.04366720020771027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,64,power_law_1.2,0.04798080027103424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,64,power_law_1.2,0.04959999918937683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,64,power_law_1.2,0.058355200290679934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,64,power_law_1.2,0.07177600264549255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,64,power_law_1.2,0.09633280038833618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,64,power_law_1.2,0.11487360000610351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,64,power_law_1.2,0.159334397315979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,64,power_law_1.2,0.1869439959526062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,64,power_law_1.2,0.2738624095916748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,64,balanced,0.4371466636657715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,64,power_law_1.2,0.42062082290649416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,64,power_law_1.2,0.4795328140258789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,128,balanced,0.06389866769313812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,64,power_law_1.2,0.7473408222198487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,128,balanced,0.05991999804973602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,64,power_law_1.2,1.808518409729004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,128,balanced,0.060592000683148704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,128,balanced,0.06397333244482677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,64,power_law_1.2,0.022047999501228332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,128,balanced,0.06339199841022491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,64,power_law_1.2,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,128,balanced,0.06790400048096974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,64,power_law_1.2,0.02210559993982315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,128,balanced,0.06321066617965698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,128,balanced,0.056688000758488975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,64,power_law_1.2,0.02369280010461807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,128,balanced,0.059578667084376015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,64,power_law_1.2,0.024665600061416625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,128,balanced,0.06473066906134288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,64,power_law_1.2,0.02542079985141754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,128,balanced,0.06366933385531108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,64,power_law_1.2,0.02588160037994385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,128,balanced,0.06017066538333893
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,64,power_law_1.2,0.026060798764228822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,128,balanced,0.06540266672770183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,64,power_law_1.2,0.026144000887870788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,128,balanced,0.05889600018660227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,64,power_law_1.2,0.0263808012008667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,128,balanced,0.06696000198523204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,64,power_law_1.2,0.027039998769760133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,64,power_law_1.2,0.027871999144554137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,128,balanced,0.06534400085608165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,64,power_law_1.2,0.028748801350593566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,128,balanced,0.06203199923038483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,64,power_law_1.2,0.030854400992393494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,128,balanced,0.06277866661548615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,64,power_law_1.2,0.033657601475715636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,128,balanced,0.04602666695912679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,128,balanced,0.06171200176080068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,64,power_law_1.2,0.0359360009431839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,128,balanced,0.04634666442871094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,128,balanced,0.04629333317279816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,128,balanced,0.06072533130645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,128,balanced,0.0487413356701533
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,64,power_law_1.2,0.03925760090351105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,128,balanced,0.05941333373387655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,128,balanced,0.049029335379600525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,64,power_law_1.2,0.04653440117835998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,128,balanced,0.05031999945640564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,64,power_law_1.2,0.05438719987869263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,128,power_law_1.01,0.06105599999427795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,128,balanced,0.09103999535242717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,128,balanced,0.04971733192602793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,128,power_law_1.01,0.059084802865982056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,128,balanced,0.05012266834576925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,128,balanced,0.026522666215896606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,128,power_law_1.01,0.06234880089759827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,128,balanced,0.04754666487375895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,64,power_law_1.2,0.07119359970092773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,128,power_law_1.01,0.06240000128746033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,128,balanced,0.08737599849700928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,128,balanced,0.026687999566396076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,128,power_law_1.01,0.06270080208778381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,128,balanced,0.05115733544031779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,128,balanced,0.02665599932273229
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,64,power_law_1.2,0.07651839852333069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,128,power_law_1.01,0.0637440025806427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,128,balanced,0.04852266609668732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,128,balanced,0.027658666173617046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,128,power_law_1.01,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,64,power_law_1.2,0.11189759969711303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,128,balanced,0.050383999943733215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,128,power_law_1.01,0.06105599999427795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,128,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,128,balanced,0.1150933305422465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,128,power_law_1.01,0.05913599729537964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,128,balanced,0.029738667110602062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,128,balanced,0.047824000318845115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,64,power_law_1.2,0.12788480520248413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,128,power_law_1.01,0.05941759943962097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,128,balanced,0.030080000559488933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,128,power_law_1.01,0.05731840133666992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,128,balanced,0.048565333088239036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,128,power_law_1.01,0.05414400100708008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,128,balanced,0.02998399982849757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,128,balanced,0.05407466491063436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,128,power_law_1.01,0.052851200103759766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,128,balanced,0.030181333422660828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,64,power_law_1.2,0.24369919300079346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,128,power_law_1.01,0.048844799399375916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,128,balanced,0.052373334765434265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,128,balanced,0.13102400302886963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,128,balanced,0.03052799900372823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,128,power_law_1.01,0.050892800092697144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,64,power_law_1.2,0.27038719654083254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,128,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,128,balanced,0.031040000418821972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,128,power_law_1.01,0.06801279783248901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,128,power_law_1.01,0.07420160174369812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,128,balanced,0.031189332405726116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,128,balanced,0.0566293348868688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,64,power_law_1.2,0.4348480224609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,128,power_law_1.01,0.08983039855957031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,128,balanced,0.032101333141326904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,128,power_law_1.01,0.09935359954833985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,128,balanced,0.05778133372465769
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,128,balanced,0.032399999598662056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,128,power_law_1.01,0.13344000577926635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,64,power_law_1.2,0.5988160133361816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,128,power_law_1.01,0.16153600215911865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,128,balanced,0.03503466645876566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,128,balanced,0.18819733460744223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,128,power_law_1.01,0.2251199960708618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,128,balanced,0.065610667069753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,128,power_law_1.01,0.04286080002784729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,128,balanced,0.034202667574087776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,128,power_law_1.01,0.27429120540618895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,128,power_law_1.01,0.4455296039581299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,128,balanced,0.07414400080839793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,128,power_law_1.01,0.04131200015544891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,64,power_law_1.2,0.7402112007141113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,128,power_law_1.01,0.5143424034118652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,128,power_law_1.01,0.04199039936065674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,128,power_law_1.01,0.9252415657043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,64,power_law_1.2,1.1164671897888183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,128,power_law_1.01,0.045132800936698914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,128,balanced,0.10136533776919048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,128,power_law_1.01,1.1182016372680663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,128,balanced,0.03504000107447306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,128,power_law_1.01,0.04408319890499115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,128,power_law_1.01,1.6113855361938476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,64,power_law_1.2,2.9355072021484374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,128,power_law_1.01,0.04559360146522522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,128,balanced,0.037903999288876854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,128,power_law_1.01,2.770591926574707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,128,balanced,0.11097600062688191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,128,power_law_1.01,0.04787200093269348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,128,balanced,0.23083732525507608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,128,balanced,0.03807999938726425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,128,power_law_1.01,5.474803161621094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,128,power_law_1.01,0.047891199588775635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,128,power_law_1.01,0.04761599898338318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,128,balanced,0.14987732966740927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,128,power_law_1.01,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,128,power_law_1.01,0.045664000511169436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,128,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,128,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,128,power_law_1.01,0.04483200013637543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,128,balanced,0.04822933177153269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,128,balanced,0.1803306738535563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,128,power_law_1.01,0.04405759871006012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,128,power_law_1.01,0.046086400747299194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,128,balanced,0.2858560085296631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,128,power_law_1.01,0.05312640070915222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,128,power_law_1.01,0.05809280276298523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,128,power_law_1.01,0.07802240252494812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,128,power_law_1.01,0.0803264021873474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,128,balanced,0.05977066854635874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,128,balanced,0.2545599937438965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,128,power_law_1.01,0.10959999561309815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,128,power_law_1.01,0.13313280344009398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,128,power_law_1.01,0.18705919981002808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,128,balanced,0.06701333324114482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,128,power_law_1.01,0.2400831937789917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,128,power_law_1.01,0.3210560083389282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,128,power_law_1.01,0.49169278144836426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,128,power_law_1.01,0.701913595199585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,128,balanced,0.32157333691914874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,128,power_law_1.01,0.8763520240783691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,128,power_law_1.01,1.015436840057373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,128,balanced,0.08493866523106892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,128,balanced,0.4283039967219035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,128,power_law_1.01,1.8246591567993165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,128,power_law_1.01,3.847929763793945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,128,power_law_1.01,0.025830399990081788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,128,power_law_1.01,0.025990399718284606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,128,balanced,0.3940533399581909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,128,power_law_1.01,0.026015999913215637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,128,power_law_1.01,0.027910399436950683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,128,power_law_1.2,0.06093440055847168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,128,balanced,0.09983467062314351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,128,power_law_1.01,0.028307199478149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,128,power_law_1.01,0.029120001196861266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,128,power_law_1.2,0.05931519865989685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,128,power_law_1.01,0.029683199524879456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,128,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,128,power_law_1.01,0.029919999837875366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,128,power_law_1.2,0.0609279990196228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,128,power_law_1.01,0.029971200227737426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,128,power_law_1.2,0.06122879981994629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,128,power_law_1.01,0.030124801397323608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,128,power_law_1.2,0.06343039870262146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,128,power_law_1.01,0.03147520124912262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,128,power_law_1.2,0.06188160181045532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,128,power_law_1.01,0.03172479867935181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,128,balanced,0.13522666692733765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,128,power_law_1.2,0.05555199980735779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,128,power_law_1.01,0.03225600123405457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,128,power_law_1.2,0.05914880037307739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,128,power_law_1.01,0.03586559891700745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,128,power_law_1.2,0.061926400661468504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,128,balanced,0.603925347328186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,128,power_law_1.01,0.03800320029258728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,128,power_law_1.2,0.05494400262832642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,128,power_law_1.01,0.03994880020618439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,128,power_law_1.2,0.054022401571273804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,128,power_law_1.2,0.05360640287399292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,128,power_law_1.01,0.05234559774398804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,128,power_law_1.2,0.05100160241127014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,128,power_law_1.01,0.06387199759483338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,128,power_law_1.2,0.07429760098457336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,128,power_law_1.2,0.07572479844093323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,128,power_law_1.01,0.08244479894638061
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,128,balanced,0.16858667135238647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,128,balanced,0.8216586907704672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,128,power_law_1.2,0.07801600098609925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,128,power_law_1.2,0.10399999618530273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,128,power_law_1.01,0.09118080139160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,128,power_law_1.2,0.12710399627685548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,128,power_law_1.01,0.11593600511550903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,128,power_law_1.2,0.18888319730758668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,128,power_law_1.2,0.2253887891769409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,128,power_law_1.01,0.1379520058631897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,128,power_law_1.2,0.3376895904541016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,128,power_law_1.01,0.18989440202713012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,128,power_law_1.2,0.47385601997375487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,128,power_law_1.2,0.6838719844818115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,128,power_law_1.2,0.8872575759887695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,128,power_law_1.01,0.28448638916015623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,128,power_law_1.2,1.4077568054199219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,128,power_law_1.2,1.8985471725463867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,128,balanced,0.20245865980784097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,128,power_law_1.01,0.35047039985656736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,128,power_law_1.2,2.436191940307617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,128,power_law_1.01,0.5027135848999024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,128,power_law_1.2,4.004691314697266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,128,power_law_1.01,0.6082240104675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,128,power_law_1.2,7.973856353759766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,128,balanced,1.1697973410288494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,128,power_law_1.01,0.7668992042541504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,128,power_law_1.01,1.4967359542846679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,128,power_law_1.01,2.882054328918457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,128,power_law_1.2,0.04490239918231964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,128,balanced,0.3076159954071045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,128,power_law_1.2,0.044787201285362246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,128,power_law_1.2,0.04504320025444031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,128,power_law_1.2,0.0471231997013092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,128,power_law_1.2,0.04639999866485596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,128,power_law_1.2,0.04836480021476745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,128,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,128,power_law_1.2,0.02566399872303009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,128,power_law_1.2,0.04756479859352112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,128,power_law_1.2,0.02588160037994385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,128,power_law_1.2,0.04713599979877472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,128,power_law_1.2,0.04734080135822296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,128,power_law_1.2,0.02602880001068115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,128,power_law_1.2,0.047007998824119566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,128,power_law_1.2,0.027980801463127137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,128,power_law_1.2,0.04661760032176972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,128,power_law_1.2,0.04599039852619171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,128,power_law_1.2,0.028352001309394838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,128,power_law_1.2,0.04229120016098022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,128,power_law_1.2,0.02919679880142212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,128,power_law_1.2,0.055257600545883176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,128,power_law_1.2,0.029676800966262816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,128,power_law_1.2,0.05953279733657837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,128,power_law_1.2,0.06832000017166137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,128,power_law_1.2,0.029766398668289184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,128,power_law_1.2,0.08256639838218689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,128,power_law_1.2,0.02980479896068573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,128,power_law_1.2,0.09864959716796876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,128,power_law_1.2,0.14687360525131227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,128,power_law_1.2,0.03048959970474243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,128,power_law_1.2,0.172160005569458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,128,power_law_1.2,0.03152639865875244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,128,power_law_1.2,0.24257919788360596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,128,power_law_1.2,0.03261440098285675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,128,power_law_1.2,0.3230720043182373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,128,power_law_1.2,0.03524479866027832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,128,power_law_1.2,0.509606409072876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,128,power_law_1.2,0.037484800815582274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,128,power_law_1.2,0.6412864208221436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,128,power_law_1.2,0.9201279640197754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,128,power_law_1.2,0.043110400438308716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,128,power_law_1.2,1.2793536186218262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,128,power_law_1.2,0.0472896009683609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,128,power_law_1.2,1.6044736862182618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,128,power_law_1.2,2.580179214477539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,128,power_law_1.2,0.06033279895782471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,128,power_law_1.2,5.099449539184571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,128,power_law_1.2,0.08208000063896179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,128,balanced,0.6041813294092814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,128,power_law_1.2,0.10977920293807983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,64,balanced,0.033701332906881966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,64,balanced,0.0334346666932106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,128,power_law_1.2,0.13409919738769532
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,64,balanced,0.03305600086847941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,128,power_law_1.2,0.18387839794158936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,64,balanced,0.03435199956099192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,64,balanced,0.03558400024970373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,64,balanced,0.03339733431736628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,128,power_law_1.2,0.24654080867767333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,64,balanced,0.033413333197434746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,128,power_law_1.2,0.34070401191711425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,64,balanced,0.03331733246644338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,64,balanced,0.03316266586383184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,128,power_law_1.2,0.4488639831542969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,64,balanced,0.033674667278925575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,64,balanced,0.03398400048414866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,64,balanced,0.03439466655254364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,128,power_law_1.2,0.5512639999389648
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,64,balanced,0.03524799893299738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,64,balanced,0.04106133431196213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,128,power_law_1.2,0.7826623916625977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,64,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,64,balanced,0.042319998145103455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,128,power_law_1.2,1.0485568046569824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,64,balanced,0.04414933423201243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,64,balanced,0.04610666632652283
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,128,power_law_1.2,1.2653759956359862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,64,balanced,0.04626133541266123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,128,power_law_1.2,2.0565631866455076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,64,balanced,0.0497920016447703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,64,balanced,0.03269333392381668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,128,power_law_1.2,3.9707393646240234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,64,balanced,0.03252266595760981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,64,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,64,balanced,0.03209600100914637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,64,balanced,0.033770665526390076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,64,balanced,0.03542399903138479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,64,balanced,0.06772799789905548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,64,balanced,0.03641066700220108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,64,balanced,0.036271999279658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,64,balanced,0.06390933195749919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,64,balanced,0.036202666660149894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,64,balanced,0.03659199923276901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,64,balanced,0.03711999952793121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,64,balanced,0.08201066652933757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,64,balanced,0.03769599894682566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,64,balanced,0.03811733424663544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,64,balanced,0.03885866701602936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,64,balanced,0.03973866750796636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,64,balanced,0.042175998290379844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,64,balanced,0.08339200417200725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,64,balanced,0.0421013335386912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,64,balanced,0.04375466704368591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,64,balanced,0.04614933331807455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,64,balanced,0.04880533119042715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,64,balanced,0.05871999760468801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,64,balanced,0.11275733510653178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,64,balanced,0.06743999818960826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,64,balanced,0.08721066514650981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,64,power_law_1.01,0.03882879912853241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,64,power_law_1.01,0.035359999537467955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,64,balanced,0.09575466314951579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,64,power_law_1.01,0.03221760094165802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,64,balanced,0.1272053321202596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,64,power_law_1.01,0.0335999995470047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,64,power_law_1.01,0.03501439988613129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,64,power_law_1.01,0.032671999931335446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,64,power_law_1.01,0.03523840010166168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,64,power_law_1.01,0.03429119884967804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,64,balanced,0.12547199924786887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,64,power_law_1.01,0.03708159923553467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,64,power_law_1.01,0.035180801153182985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,64,power_law_1.01,0.035488000512123107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,64,balanced,0.02638400097688039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,64,power_law_1.01,0.03229439854621887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,64,power_law_1.01,0.03550080060958862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,64,balanced,0.026191999514897663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,64,power_law_1.01,0.032652801275253295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,64,power_law_1.01,0.03598720133304596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,64,balanced,0.026346666117509205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,64,balanced,0.14542933305104574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,64,power_law_1.01,0.03627519905567169
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,64,power_law_1.01,0.03606399893760681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,64,balanced,0.02757333219051361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,64,power_law_1.01,0.03668479919433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,64,power_law_1.01,0.03962239921092987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,64,balanced,0.02922133356332779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,64,balanced,0.1474240024884542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,64,power_law_1.01,0.03898240029811859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,64,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,64,balanced,0.03028800090154012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,64,power_law_1.01,0.049081599712371825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,64,power_law_1.01,0.039366400241851805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,64,balanced,0.03038399914900462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,64,power_law_1.01,0.04017919898033142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,64,power_law_1.01,0.05143679976463318
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,64,balanced,0.03035733352104823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,64,balanced,0.20229333639144897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,64,power_law_1.01,0.041510400176048276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,64,power_law_1.01,0.053420799970626834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,64,balanced,0.03051200012365977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,64,power_law_1.01,0.04288640022277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,64,balanced,0.030896000564098358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,64,power_law_1.01,0.04382080137729645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,64,balanced,0.03146666785081228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,64,power_law_1.01,0.044633600115776065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,64,power_law_1.01,0.04561919867992401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,64,balanced,0.03196266790231069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,64,power_law_1.01,0.04696959853172302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,64,power_law_1.01,0.045184001326560974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,64,balanced,0.03253866732120514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,64,power_law_1.01,0.061363202333450315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,64,power_law_1.01,0.05111039876937866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,64,balanced,0.03287466615438461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,64,power_law_1.01,0.06207360029220581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,64,power_law_1.01,0.06375679969787598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,64,balanced,0.03610666592915853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,64,power_law_1.01,0.08179200291633607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,64,power_law_1.01,0.06627839803695679
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,64,balanced,0.2507680058479309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,64,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,64,power_law_1.01,0.09806720018386841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,64,power_law_1.01,0.08497920036315917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,64,power_law_1.01,0.1284160017967224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,64,power_law_1.01,0.08970239758491516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,64,balanced,0.2153279980023702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,64,power_law_1.01,0.14226560592651366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,64,power_law_1.01,0.1298624038696289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,64,power_law_1.2,0.03369599878787995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,64,power_law_1.01,0.1208448052406311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,64,power_law_1.01,0.19150079488754274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,64,balanced,0.03630933413902918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,64,power_law_1.2,0.032620799541473386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,64,power_law_1.01,0.1750656008720398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,64,power_law_1.01,0.2419327974319458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,64,power_law_1.2,0.03255679905414581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,64,power_law_1.01,0.2517375946044922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,64,balanced,0.039546666045983635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,64,power_law_1.01,0.3440768003463745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,64,power_law_1.2,0.034355199337005614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,64,power_law_1.01,0.026752001047134398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,64,power_law_1.2,0.03505919873714447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,64,power_law_1.01,0.30547199249267576
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,64,power_law_1.01,0.4768832206726074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,64,balanced,0.0399893323580424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,64,power_law_1.2,0.03242239952087402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,64,power_law_1.01,0.026035198569297792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,64,balanced,0.30018667380015057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,64,power_law_1.01,0.4022975921630859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,64,power_law_1.01,0.5578368186950684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,64,power_law_1.2,0.032601600885391234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,64,power_law_1.01,0.026182401180267333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,64,power_law_1.2,0.03969280123710632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,64,power_law_1.01,0.4344831943511963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,64,power_law_1.01,0.838368034362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,64,power_law_1.01,0.028204798698425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,64,power_law_1.2,0.04186240136623383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,64,power_law_1.01,0.02863360047340393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,64,power_law_1.2,0.04359039962291718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,64,power_law_1.01,0.6625855922698974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,64,power_law_1.01,1.931635284423828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,64,power_law_1.2,0.04995200037956238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,64,power_law_1.01,0.029606398940086365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,64,balanced,0.0469706654548645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,64,power_law_1.2,0.05551360249519348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,64,power_law_1.01,0.03038719892501831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,64,power_law_1.01,1.3820608139038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,64,power_law_1.2,0.06657919883728028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,64,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,64,power_law_1.2,0.04387840032577515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,64,balanced,0.05150400102138519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,64,power_law_1.01,0.030342400074005127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,64,power_law_1.2,0.04552319943904877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,64,power_law_1.2,0.046003198623657225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,64,power_law_1.01,0.03080959916114807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,64,power_law_1.2,0.05397760272026062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,64,power_law_1.01,0.0319680005311966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,64,power_law_1.2,0.07028480172157288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,64,power_law_1.01,0.033344000577926636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,64,power_law_1.2,0.0789247989654541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,64,balanced,0.06451733410358429
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,64,power_law_1.2,0.10121599435806275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,64,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,64,power_law_1.2,0.149619197845459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,64,power_law_1.01,0.03727999925613403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,64,power_law_1.2,0.18010239601135253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,64,power_law_1.01,0.0416128009557724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,64,power_law_1.2,0.18528640270233154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,64,balanced,0.07424533367156982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,64,balanced,0.4532639980316162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,64,power_law_1.2,0.2545727968215942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,64,power_law_1.01,0.043084800243377686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,64,power_law_1.2,0.31663360595703127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,64,power_law_1.2,0.6189375877380371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,64,power_law_1.01,0.04901120066642761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,64,power_law_1.2,0.6432576179504395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,64,power_law_1.01,0.06353920102119445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,64,power_law_1.2,0.8031680107116699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,64,power_law_1.2,0.03917439877986908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,64,power_law_1.01,0.07960320115089417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,64,power_law_1.2,1.0592127799987794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,64,balanced,0.3810133139292399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,64,power_law_1.2,0.03182080090045929
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,64,balanced,0.09648000200589497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,64,power_law_1.2,3.212307357788086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,64,power_law_1.2,0.03242239952087402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,64,power_law_1.01,0.08887040019035339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,64,power_law_1.2,0.034169599413871765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,64,power_law_1.01,0.11421439647674561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,64,power_law_1.2,0.034745600819587705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,64,power_law_1.2,0.036160001158714296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,64,power_law_1.01,0.13379199504852296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,64,power_law_1.2,0.03550719916820526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,64,power_law_1.01,0.19695359468460083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,64,balanced,0.11513599753379822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,64,power_law_1.2,0.03609600067138672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,64,power_law_1.2,0.03633280098438263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,64,power_law_1.01,0.2693759918212891
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,64,power_law_1.2,0.03666560053825378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,64,power_law_1.2,0.03815680146217346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,64,power_law_1.01,0.3348031997680664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,64,power_law_1.2,0.0395583987236023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,64,power_law_1.2,0.04014720022678375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,64,power_law_1.2,0.041529598832130435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,64,balanced,0.16024000446001688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,64,power_law_1.01,0.48360958099365237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,64,power_law_1.2,0.044435200095176694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,64,power_law_1.2,0.04760960042476654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,64,power_law_1.2,0.05123839974403381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,64,power_law_1.2,0.06241919994354248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,64,power_law_1.01,0.5972032070159912
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,64,power_law_1.2,0.07259520292282104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,64,balanced,0.8607892990112305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,64,power_law_1.01,0.7995903968811036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,64,power_law_1.2,0.08269439935684204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,64,power_law_1.01,1.18088960647583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,64,power_law_1.2,0.11029119491577148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,64,balanced,0.19954133033752441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,64,power_law_1.01,2.6814912796020507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,64,power_law_1.2,0.16481280326843262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,64,power_law_1.2,0.17301759719848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,64,power_law_1.2,0.24455680847167968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,64,power_law_1.2,0.3349503993988037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,64,power_law_1.2,0.5919360160827637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,64,power_law_1.2,0.600767993927002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,64,balanced,0.2417866587638855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,64,power_law_1.2,0.9444543838500976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,64,power_law_1.2,1.5643263816833497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,64,power_law_1.2,2.9568384170532225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,64,balanced,0.39379199345906574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,32,balanced,0.03349866718053818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,32,balanced,0.029472000896930695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,32,balanced,0.029482667644818623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,32,balanced,0.030458666384220123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,64,power_law_1.2,0.026745599508285523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,32,balanced,0.03200533241033554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,32,balanced,0.03646933287382126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,64,balanced,0.7514826456705729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,64,power_law_1.2,0.02595840096473694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,32,balanced,0.03677333394686381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,64,power_law_1.2,0.02661119997501373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,32,balanced,0.03675200045108795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,64,power_law_1.2,0.028537601232528687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,32,balanced,0.036362667878468834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,64,power_law_1.2,0.02868480086326599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,32,balanced,0.036874666810035706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,64,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,32,balanced,0.03733866661787033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,64,power_law_1.2,0.030188798904418945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,32,balanced,0.038191998998324074
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,64,power_law_1.2,0.03057279884815216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,32,balanced,0.03913066784540812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,64,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,32,balanced,0.04222933451334635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,32,balanced,0.032474666833877563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,64,power_law_1.2,0.032051199674606325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,32,balanced,0.043285335103670754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,64,power_law_1.2,0.033657601475715636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,32,balanced,0.04418666660785675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,32,balanced,0.03188266605138779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,64,power_law_1.2,0.03446399867534637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,32,balanced,0.03159466634194056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,32,balanced,0.04445866743723551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,32,balanced,0.033802665770053864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,64,power_law_1.2,0.03623040020465851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,32,balanced,0.04647466540336609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,32,balanced,0.03606399893760681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,64,power_law_1.2,0.037990400195121767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,32,balanced,0.03833066672086716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,32,balanced,0.047695999344189964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,64,power_law_1.2,0.04251520037651062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,32,balanced,0.036501333117485046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,32,balanced,0.026261332134405773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,64,power_law_1.2,0.045798400044441225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,32,balanced,0.050853331883748375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,32,balanced,0.036848001182079315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,32,balanced,0.02606933315594991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,32,balanced,0.02629866699377696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,32,balanced,0.036757332583268486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,32,balanced,0.05596800148487091
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,32,balanced,0.028336000939210255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,32,balanced,0.03726933399836222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,64,power_law_1.2,0.05672320127487183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,32,balanced,0.029733332494894665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,32,balanced,0.037632000943024956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,64,power_law_1.2,0.0686784029006958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,32,balanced,0.030805334448814392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,32,balanced,0.07137600084145863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,32,balanced,0.030991998811562855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,32,balanced,0.03770133356253306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,64,power_law_1.2,0.08475520014762879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,32,balanced,0.03072533259789149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,32,balanced,0.03987200061480204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,32,balanced,0.03084266682465871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,32,balanced,0.031386665999889374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,32,balanced,0.041050667564074196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,32,balanced,0.068271999557813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,32,balanced,0.03175999969244003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,64,power_law_1.2,0.10384000539779663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,32,balanced,0.042506664991378784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,32,balanced,0.032485333581765495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,64,power_law_1.2,0.1385151982307434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,32,balanced,0.033471999069054924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,32,balanced,0.04260799785455068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,32,balanced,0.033957332372665405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,32,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,32,balanced,0.09112000465393066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,64,power_law_1.2,0.20784640312194824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,32,balanced,0.04790933430194855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,64,power_law_1.2,0.2742399930953979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,32,balanced,0.037658666570981346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,32,balanced,0.0369759996732076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,32,balanced,0.0490880012512207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,32,balanced,0.060693333546320595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,64,power_law_1.2,0.3801791906356812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,32,power_law_1.01,0.03575679957866669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,32,balanced,0.09351999560991923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,32,power_law_1.01,0.03573119938373566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,32,balanced,0.0712960014740626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,32,power_law_1.01,0.029657599329948426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,64,power_law_1.2,0.6533184051513672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,32,balanced,0.038549333810806274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,32,power_law_1.01,0.02861439883708954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,32,power_law_1.01,0.03198080062866211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,32,balanced,0.04281599819660187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,32,power_law_1.01,0.030630400776863097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,32,balanced,0.09091200431187947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,32,power_law_1.01,0.03224320113658905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,64,power_law_1.2,0.7482816219329834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,32,balanced,0.04399999976158142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,32,power_law_1.01,0.03172479867935181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,32,power_law_1.01,0.03427839875221252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,32,power_law_1.01,0.035776001214981076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,32,balanced,0.13384000460306802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,64,power_law_1.2,1.0044480323791505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,32,power_law_1.01,0.03480960130691528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,32,balanced,0.10065066814422607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,32,power_law_1.01,0.035750401020050046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,32,balanced,0.05301333467165629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,64,power_law_1.2,1.393331241607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,32,power_law_1.01,0.03730559945106506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,32,power_law_1.01,0.03948160111904144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,32,power_law_1.01,0.03601920008659363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,32,power_law_1.01,0.03952000141143799
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,64,power_law_1.2,2.5714239120483398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,32,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,32,power_law_1.01,0.0282368004322052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,32,power_law_1.01,0.04659200012683869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,32,power_law_1.01,0.03638400137424469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,32,balanced,0.13640532890955606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,64,power_law_1.2,5.333139038085937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,32,power_law_1.01,0.05264639854431152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,32,power_law_1.01,0.026956799626350402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,32,power_law_1.01,0.03729279935359955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,32,power_law_1.01,0.05514240264892578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,32,power_law_1.01,0.026368001103401185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,32,power_law_1.01,0.03768959939479828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,32,balanced,0.07894399762153625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,32,power_law_1.01,0.057030397653579715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,32,balanced,0.15269333124160767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,32,power_law_1.01,0.02863360047340393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,32,power_law_1.01,0.040166398882865904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,32,power_law_1.01,0.04419200122356415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,32,balanced,0.15781866510709128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,32,power_law_1.01,0.029235199093818665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,32,power_law_1.01,0.039987200498580934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,32,power_law_1.01,0.04776319861412048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,32,balanced,0.08991466959317525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,32,power_law_1.01,0.03030399978160858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,32,power_law_1.01,0.04073599874973297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,32,power_law_1.01,0.04880000054836273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,32,power_law_1.01,0.030630400776863097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,32,power_law_1.01,0.042534399032592776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,32,power_law_1.01,0.05013759732246399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,32,power_law_1.01,0.03166080117225647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,32,power_law_1.01,0.057574397325515746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,32,power_law_1.01,0.04580479860305786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,32,power_law_1.01,0.062489598989486694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,32,power_law_1.01,0.032595199346542356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,32,power_law_1.01,0.0460671991109848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,32,balanced,0.12038933237393697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,32,balanced,0.22332799434661865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,32,power_law_1.01,0.07875199913978577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,32,power_law_1.01,0.03304319977760315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,32,power_law_1.01,0.050809597969055174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,32,power_law_1.01,0.09140480160713196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,32,power_law_1.01,0.034745600819587705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,32,balanced,0.18182400862375894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,32,power_law_1.01,0.057068800926208495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,32,power_law_1.01,0.12152960300445556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,32,power_law_1.01,0.0355648010969162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,32,power_law_1.01,0.06417279839515685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,32,power_law_1.01,0.12460160255432129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,32,power_law_1.01,0.03699199855327606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,32,power_law_1.01,0.16384639739990234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,32,power_law_1.01,0.08266239762306213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,32,power_law_1.01,0.21626880168914794
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,32,power_law_1.01,0.039468801021575926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,32,power_law_1.01,0.09735040068626404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,32,balanced,0.1485973298549652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,32,power_law_1.01,0.30088319778442385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,32,power_law_1.01,0.12422399520874024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,32,power_law_1.01,0.04343680143356323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,32,balanced,0.28272533416748047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,32,power_law_1.01,0.32055680751800536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,32,power_law_1.01,0.14851200580596924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,32,power_law_1.01,0.04436480104923248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,32,power_law_1.01,0.3913919925689697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,32,power_law_1.01,0.19845759868621826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,32,power_law_1.01,0.24387199878692628
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,32,power_law_1.01,0.6235648155212402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,32,power_law_1.01,0.052857601642608644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,32,power_law_1.01,0.371891188621521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,32,power_law_1.01,1.6527360916137694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,32,power_law_1.01,0.06920959949493408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,32,power_law_1.01,0.43009281158447266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,32,balanced,0.21636799971262613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,32,power_law_1.01,0.07049599885940552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,32,power_law_1.01,0.5901567935943604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,32,balanced,0.266810675462087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,32,power_law_1.01,0.08769919872283935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,32,power_law_1.01,0.8707712173461915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,32,balanced,0.33894399801890057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,32,power_law_1.01,0.12331520318984986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,32,power_law_1.01,1.7558271408081054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,32,power_law_1.01,0.2043776035308838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,32,power_law_1.01,0.1932927966117859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,32,power_law_1.01,0.29809279441833497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,32,power_law_1.2,0.03580799996852875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,32,balanced,0.2897599935531616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,32,power_law_1.2,0.02871040105819702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,32,power_law_1.01,0.35438721179962157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,32,power_law_1.2,0.02933120131492615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,32,power_law_1.2,0.03110400140285492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,32,power_law_1.01,0.708019208908081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,32,power_law_1.2,0.03185279965400696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,32,power_law_1.2,0.03578239977359772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,32,power_law_1.01,0.7375232219696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,32,power_law_1.2,0.0359935998916626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,32,balanced,0.5099786520004272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,32,power_law_1.01,0.8814208030700683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,32,power_law_1.2,0.03978880047798157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,32,power_law_1.2,0.0441536009311676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,32,balanced,0.3530293305714925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,32,power_law_1.01,1.3166208267211914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,32,power_law_1.2,0.05051519870758057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,32,power_law_1.2,0.054713600873947145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,32,power_law_1.01,2.8265663146972657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,32,power_law_1.2,0.05995519757270813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,32,power_law_1.2,0.0716480016708374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,32,power_law_1.2,0.045177599787712096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,32,power_law_1.2,0.047788798809051514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,32,power_law_1.2,0.05081599950790405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,32,balanced,0.4928319851557414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,32,power_law_1.2,0.052083200216293334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,32,power_law_1.2,0.061612802743911746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,32,power_law_1.2,0.07294719815254211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,32,power_law_1.2,0.09773439764976502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,32,balanced,0.5459946791330973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,32,power_law_1.2,0.0992255985736847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,32,power_law_1.2,0.14391679763793946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,32,power_law_1.2,0.16497279405593873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,32,power_law_1.2,0.26097280979156495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,32,power_law_1.2,0.31912961006164553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,32,power_law_1.2,0.43968000411987307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,32,power_law_1.2,0.5662335872650146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,32,power_law_1.2,0.7865536212921143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,32,balanced,0.984597365061442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,32,power_law_1.2,1.213548755645752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,32,power_law_1.2,2.4734272003173827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,32,power_law_1.2,0.0358271986246109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,32,power_law_1.2,0.031974399089813234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,32,balanced,1.0539733568827312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,32,power_law_1.2,0.03265919983386993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,32,power_law_1.2,0.03418239951133728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,32,power_law_1.2,0.03438720107078552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,32,power_law_1.2,0.03733119964599609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,32,power_law_1.2,0.03592959940433502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,32,power_law_1.2,0.036550399661064145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,32,power_law_1.2,0.03744640052318573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,32,power_law_1.2,0.0381632000207901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,32,power_law_1.2,0.04049279987812042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,32,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,32,power_law_1.2,0.04199680089950562
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,32,power_law_1.2,0.04289920032024384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,32,power_law_1.2,0.04794879853725433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,32,power_law_1.2,0.04839679896831513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,32,power_law_1.2,0.05281919836997986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,32,power_law_1.2,0.06234239935874939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,32,power_law_1.2,0.06815360188484192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,32,power_law_1.2,0.08922240138053894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,32,power_law_1.2,0.10347520112991333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,32,power_law_1.2,0.14551680088043212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,32,power_law_1.2,0.17536640167236328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,32,power_law_1.2,0.2617727994918823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,32,power_law_1.2,0.30405120849609374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,32,power_law_1.2,0.028204798698425293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,32,power_law_1.2,0.5075071811676025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,32,power_law_1.2,0.026476800441741943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,32,power_law_1.2,0.6690944194793701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,32,power_law_1.2,0.02656640112400055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,16,balanced,0.03937066594759623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,32,power_law_1.2,0.028575998544692994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,32,power_law_1.2,0.8055168151855469
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,16,balanced,0.033088001112143196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,32,power_law_1.2,0.029388800263404846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,32,power_law_1.2,1.5390015602111817
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,16,balanced,0.033573334415753685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,32,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,16,balanced,0.035674666364987694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,32,power_law_1.2,0.030937600135803222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,32,power_law_1.2,3.475795364379883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,16,balanced,0.03698666642109553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,32,power_law_1.2,0.03252480030059814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,16,balanced,0.03823466598987579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,32,power_law_1.2,0.033055999875068666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,16,balanced,0.03809600075085958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,32,power_law_1.2,0.03340800106525421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,16,balanced,0.03811199963092804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,32,power_law_1.2,0.03553279936313629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,16,balanced,0.03824000060558319
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,32,power_law_1.2,0.03687680065631867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,16,balanced,0.038346665600935616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,32,power_law_1.2,0.0387584000825882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,16,balanced,0.04453866680463155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,32,power_law_1.2,0.04243200123310089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,16,balanced,0.03922666609287262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,16,balanced,0.03908800085385641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,32,power_law_1.2,0.045286399126052854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,16,balanced,0.04030400017897288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,32,power_law_1.2,0.04633600115776062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,16,balanced,0.04268266757329305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,16,balanced,0.0433599998553594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,32,power_law_1.2,0.054527997970581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,16,balanced,0.04580800235271454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,16,balanced,0.03212266663710276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,16,balanced,0.050586665670077004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,32,power_law_1.2,0.07366399765014649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,16,balanced,0.0322773332397143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,32,power_law_1.2,0.09174399971961975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,16,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,16,balanced,0.03277866790692011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,16,balanced,0.03461866577466329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,32,power_law_1.2,0.10670080184936523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,16,balanced,0.057328000664711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,16,balanced,0.03692266593376795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,32,power_law_1.2,0.14384000301361083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,16,balanced,0.03773866593837738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,16,balanced,0.06610133250554402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,16,balanced,0.038021333515644073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,32,power_law_1.2,0.2081536054611206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,16,balanced,0.0383146678407987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,16,balanced,0.07338133454322815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,32,power_law_1.2,0.27820160388946535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,16,balanced,0.038975998759269714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,32,power_law_1.2,0.4446144104003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,16,balanced,0.03920533259709676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,16,balanced,0.0817493349313736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,16,balanced,0.03941333293914795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,32,power_law_1.2,0.5013311862945556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,16,balanced,0.039247999588648476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,16,balanced,0.040549332896868386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,32,power_law_1.2,0.9817983627319335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,16,balanced,0.1048959990342458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,16,balanced,0.041402667760849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,16,balanced,0.04469866553942362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,32,power_law_1.2,1.1996479988098145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,16,balanced,0.044309332966804504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,16,balanced,0.0461706668138504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,32,power_law_1.2,1.7710464477539063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,16,balanced,0.12250133355458577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,16,balanced,0.05031999945640564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,32,power_law_1.2,3.0021120071411134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,16,balanced,0.05392000079154968
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,32,power_law_1.2,5.043379211425782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,16,power_law_1.01,0.04576640129089356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,16,balanced,0.06655466556549072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,16,power_law_1.01,0.03824639916419983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,16,power_law_1.01,0.03537279963493347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,16,power_law_1.01,0.03322240114212036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,16,balanced,0.18212266763051352
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,16,balanced,0.0804746647675832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,16,power_law_1.01,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,16,power_law_1.01,0.03272959887981415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,16,power_law_1.01,0.0359935998916626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,16,power_law_1.01,0.034560000896453856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,16,balanced,0.09733866651852925
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,16,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,16,power_law_1.01,0.035724800825119016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,16,power_law_1.01,0.038073599338531494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,16,power_law_1.01,0.037222400307655334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,16,balanced,0.11212266484896342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,16,power_law_1.01,0.03857919871807099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,16,power_law_1.01,0.03700479865074158
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,16,power_law_1.01,0.03860479891300202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,16,power_law_1.01,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,16,balanced,0.22398932774861655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,16,power_law_1.01,0.0387584000825882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,16,power_law_1.01,0.03844479918479919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,16,balanced,0.15455999970436096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,16,power_law_1.01,0.03947519958019256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,16,power_law_1.01,0.0390720009803772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,16,power_law_1.01,0.042438399791717527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,16,power_law_1.01,0.04012160003185272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,16,power_law_1.01,0.04481280148029328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,16,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,16,power_law_1.01,0.04336000084877014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,16,power_law_1.01,0.045407998561859134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,16,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,16,balanced,0.1873226761817932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,16,power_law_1.01,0.0480320006608963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,16,power_law_1.01,0.04855040013790131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,16,power_law_1.01,0.05053439736366272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,16,power_law_1.01,0.05052800178527832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,16,power_law_1.01,0.05431039929389954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,16,power_law_1.01,0.05382400155067444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,16,balanced,0.27449599901835126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,16,power_law_1.01,0.06099200248718262
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,16,power_law_1.01,0.06183680295944214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,16,power_law_1.01,0.06741120219230652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,16,power_law_1.01,0.0676800012588501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,16,power_law_1.01,0.06584320068359376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,16,balanced,0.27057600021362305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,16,power_law_1.01,0.08819839954376221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,16,power_law_1.01,0.0779263973236084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,16,power_law_1.01,0.10142719745635986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,16,power_law_1.01,0.09096320271492005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,16,power_law_1.01,0.1320639967918396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,16,power_law_1.01,0.11356799602508545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,16,power_law_1.01,0.15923839807510376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,16,power_law_1.01,0.1322368025779724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,16,power_law_1.01,0.22797439098358155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,16,power_law_1.01,0.183404803276062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,16,power_law_1.01,0.25557119846343995
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,16,power_law_1.01,0.2191551923751831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,16,power_law_1.01,0.3895488023757935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,16,power_law_1.01,0.3088320016860962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,16,balanced,0.3521600166956584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,16,power_law_1.01,0.5158656120300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,16,power_law_1.01,0.434003210067749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,16,power_law_1.01,0.7060095787048339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,16,power_law_1.01,0.5360320091247559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,16,balanced,0.37517865498860675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,16,power_law_1.01,0.9903360366821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,16,power_law_1.01,0.7880191802978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,16,power_law_1.01,2.44213752746582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,16,power_law_1.01,1.5337727546691895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,16,balanced,0.42455466588338214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,16,power_law_1.2,0.04482559859752655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,16,power_law_1.2,0.03341439962387085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,16,power_law_1.2,0.03400959968566895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,16,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,16,power_law_1.2,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,16,power_law_1.2,0.04191359877586365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,16,power_law_1.2,0.03825919926166534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,16,power_law_1.2,0.03826560080051422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,16,power_law_1.2,0.03871360123157501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,16,power_law_1.2,0.04043520092964172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,16,power_law_1.2,0.0434112012386322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,16,power_law_1.2,0.0459199994802475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,16,power_law_1.2,0.044614401459693906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,16,power_law_1.2,0.04938879907131195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,16,balanced,0.6264853477478027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,16,power_law_1.2,0.05123199820518494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,16,power_law_1.2,0.05472000241279602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,16,power_law_1.2,0.06172159910202026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,16,power_law_1.2,0.06883839964866638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,16,power_law_1.2,0.07035520076751708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,16,power_law_1.2,0.08674560189247131
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,16,power_law_1.2,0.10044159889221191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,16,power_law_1.2,0.13063679933547973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,16,balanced,0.7396693229675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,16,power_law_1.2,0.14240000247955323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,16,power_law_1.2,0.22721920013427735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,16,power_law_1.2,0.23224320411682128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,16,power_law_1.2,0.3500224113464355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,16,power_law_1.2,0.5472832202911377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,16,power_law_1.2,0.7295551776885987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,16,power_law_1.2,1.3691967964172362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,16,power_law_1.2,2.9488704681396483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,16,balanced,1.2420639991760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,16,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,16,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,16,power_law_1.2,0.03227519989013672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,16,power_law_1.2,0.034534400701522826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,16,power_law_1.2,0.03535360097885132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,16,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,16,power_law_1.2,0.03723520040512085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,16,power_law_1.2,0.0379967987537384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,16,power_law_1.2,0.03871360123157501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,16,power_law_1.2,0.039155200123786926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,16,power_law_1.2,0.04076800048351288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,16,power_law_1.2,0.04254719913005829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,16,power_law_1.2,0.04371840059757233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,16,power_law_1.2,0.04528000056743622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,16,power_law_1.2,0.04932479858398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,16,power_law_1.2,0.05085440278053284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,16,power_law_1.2,0.05475839972496033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,16,power_law_1.2,0.06417279839515685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,16,power_law_1.2,0.07749119997024537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,16,power_law_1.2,0.09985920190811157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,16,power_law_1.2,0.11535359621047973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,16,power_law_1.2,0.15972479581832885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,8,balanced,0.03490666548411051
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,16,power_law_1.2,0.17004159688949586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,8,balanced,0.03313066562016805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,16,power_law_1.2,0.30811519622802735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,8,balanced,0.03430933256944021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,16,power_law_1.2,0.34092159271240235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,8,balanced,0.03598399957021078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,8,balanced,0.04483733574549357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,16,power_law_1.2,0.49706878662109377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,8,balanced,0.04823466638724009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,16,power_law_1.2,0.6784192085266113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,8,balanced,0.04011733333269755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,8,balanced,0.04057066639264425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,16,power_law_1.2,0.9852607727050782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,8,balanced,0.03991466760635376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,16,power_law_1.2,1.3507712364196778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,8,balanced,0.0405173326532046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,8,balanced,0.033861334125200905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,8,balanced,0.04146133363246918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,16,power_law_1.2,3.854924774169922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,8,balanced,0.03238933285077413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,8,balanced,0.04770666857560476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,8,balanced,0.033013333876927696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,8,balanced,0.04770133395989736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,8,balanced,0.036176001032193504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,8,balanced,0.04398933549722036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,8,balanced,0.04419733087221781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,8,balanced,0.0458133320013682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,8,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,8,balanced,0.0473280002673467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,8,balanced,0.04525866607824961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,8,balanced,0.04528533418973287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,8,balanced,0.06113600234190623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,8,balanced,0.04516266783078512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,8,balanced,0.06205333272616068
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,8,balanced,0.04586133360862732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,8,balanced,0.04636266827583313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,8,balanced,0.06428800026575725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,8,balanced,0.04700266818205515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,8,balanced,0.07358400026957194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,8,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,8,balanced,0.04862933357556661
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,8,balanced,0.08772266904513042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,8,balanced,0.0491839994986852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,8,balanced,0.05037866532802582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,8,balanced,0.05821333328882853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,8,balanced,0.11846933762232463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,8,balanced,0.06213866670926412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,8,balanced,0.06250133117039998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,8,balanced,0.10821333527565002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,8,balanced,0.07702933251857758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,8,balanced,0.08961600065231323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,8,balanced,0.14619732896486917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,8,power_law_1.01,0.037248000502586365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,8,balanced,0.12127466996510823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,8,power_law_1.01,0.033843201398849485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,8,power_law_1.01,0.034176000952720643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,8,power_law_1.01,0.035776001214981076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,8,balanced,0.13962666193644205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,8,balanced,0.18915200233459473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,8,power_law_1.01,0.03814400136470795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,8,power_law_1.01,0.045203199982643126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,8,power_law_1.01,0.0361407995223999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,8,power_law_1.01,0.04074240028858185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,8,balanced,0.20137067635854086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,8,power_law_1.01,0.04081920087337494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,8,power_law_1.01,0.034227201342582704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,8,power_law_1.01,0.04154880046844482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,8,power_law_1.01,0.03304960131645203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,8,power_law_1.01,0.041920000314712526
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,8,balanced,0.27197333176930744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,8,power_law_1.01,0.03578880131244659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,8,power_law_1.01,0.04442239999771118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,8,power_law_1.01,0.03820799887180328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,8,balanced,0.2523840069770813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,8,power_law_1.01,0.04787839949131012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,8,power_law_1.01,0.043731200695037845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,8,power_law_1.01,0.048416000604629514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,8,power_law_1.01,0.044326400756835936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,8,power_law_1.01,0.05149440169334411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,8,power_law_1.01,0.058764797449111936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,8,power_law_1.01,0.043961599469184875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,8,power_law_1.01,0.058976000547409056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,8,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,8,power_law_1.01,0.06819199919700622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,8,power_law_1.01,0.045900800824165346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,8,balanced,0.3938453197479248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,8,balanced,0.3656800190607707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,8,power_law_1.01,0.07573760151863099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,8,power_law_1.01,0.04810880124568939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,8,power_law_1.01,0.0787392020225525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,8,power_law_1.01,0.04901759922504425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,8,power_law_1.01,0.09292799830436707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,8,power_law_1.01,0.05123839974403381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,8,power_law_1.01,0.11801600456237793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,8,power_law_1.01,0.051820802688598636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,8,power_law_1.01,0.1441856026649475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,8,power_law_1.01,0.05623040199279785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,8,power_law_1.01,0.05797119736671448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,8,power_law_1.01,0.14289920330047606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,8,power_law_1.01,0.06407039761543273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,8,balanced,0.46778666973114014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,8,power_law_1.01,0.1901952028274536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,8,power_law_1.01,0.07245439887046815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,8,balanced,0.4991733233133952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,8,power_law_1.01,0.26213760375976564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,8,power_law_1.01,0.07787520289421082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,8,power_law_1.01,0.378604793548584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,8,power_law_1.01,0.10124160051345825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,8,power_law_1.01,0.5852223873138428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,8,power_law_1.01,0.11934720277786255
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,8,power_law_1.01,0.7013247966766357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,8,power_law_1.01,0.15777280330657958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,8,power_law_1.01,1.239027214050293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,8,power_law_1.01,0.19569920301437377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,8,power_law_1.01,0.26677761077880857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,8,power_law_1.01,2.3109695434570314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,8,power_law_1.01,0.3520319938659668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,8,balanced,0.5718079805374146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,8,power_law_1.01,0.5126272201538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,8,power_law_1.01,0.6801407814025879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,8,power_law_1.01,0.8387007713317871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,8,power_law_1.01,1.224998378753662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,8,balanced,0.7487680117289225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,8,power_law_1.01,2.823289680480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,8,power_law_1.2,0.037324801087379456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,8,power_law_1.2,0.03482879996299744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,8,balanced,0.8926346302032471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,8,power_law_1.2,0.03487359881401062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,8,power_law_1.2,0.03701759874820709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,8,power_law_1.2,0.037920001149177554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,8,power_law_1.2,0.045049598813056944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,8,power_law_1.2,0.041843199729919435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,8,power_law_1.2,0.041407999396324155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,8,power_law_1.2,0.0418368011713028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,8,power_law_1.2,0.04305280148983002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,8,power_law_1.2,0.04759039878845215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,8,power_law_1.2,0.047167998552322385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,8,power_law_1.2,0.04922879934310913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,8,power_law_1.2,0.05420799851417542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,8,power_law_1.2,0.05849599838256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,8,power_law_1.2,0.03726080060005188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,8,power_law_1.2,0.06035199761390686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,8,power_law_1.2,0.0691648006439209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,8,power_law_1.2,0.032492798566818235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,8,power_law_1.2,0.07786880135536194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,8,power_law_1.2,0.03306879997253418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,8,power_law_1.2,0.08460800051689148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,8,power_law_1.2,0.03594880104064942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,8,power_law_1.2,0.10321279764175414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,8,power_law_1.2,0.037241598963737486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,8,power_law_1.2,0.11681920289993286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,8,power_law_1.2,0.04289279878139496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,8,balanced,1.4621599515279133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,8,power_law_1.2,0.15834879875183105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,8,power_law_1.2,0.043398401141166686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,8,power_law_1.2,0.19448319673538209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,8,power_law_1.2,0.044249600172042845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,8,power_law_1.2,0.04471679925918579
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,8,power_law_1.2,0.2275007963180542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,8,power_law_1.2,0.046323201060295104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,8,power_law_1.2,0.32666239738464353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,8,power_law_1.2,0.04808320105075836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,8,power_law_1.2,0.4738111972808838
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,8,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,8,power_law_1.2,0.7078080177307129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,8,balanced,1.756816069285075
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,8,power_law_1.2,0.05123199820518494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,8,power_law_1.2,1.0184767723083497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,8,power_law_1.2,0.05187839865684509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,8,power_law_1.2,0.05697280168533325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,8,power_law_1.2,1.3684160232543945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,8,power_law_1.2,0.059385597705841064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,8,power_law_1.2,3.1134464263916017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,8,power_law_1.2,0.06657919883728028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,8,power_law_1.2,0.07395200133323669
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,8,power_law_1.2,0.0877888023853302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,8,power_law_1.2,0.11052800416946411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,8,power_law_1.2,0.12390400171279907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,8,power_law_1.2,0.16034560203552245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,8,power_law_1.2,0.20297598838806152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,8,power_law_1.2,0.3152575969696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,8,power_law_1.2,0.37706239223480226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,8,power_law_1.2,0.6583615779876709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,8,power_law_1.2,0.8208191871643067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,8,power_law_1.2,0.8947775840759278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,8,power_law_1.2,1.5833984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,8,power_law_1.2,4.034758377075195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,32,balanced,0.05114666620890299
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,32,balanced,0.051269332567850746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,32,balanced,0.04587733248869578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,32,balanced,0.05169600248336792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,32,balanced,0.05474133292833964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,32,balanced,0.04599999884764353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,32,balanced,0.045791998505592346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,32,balanced,0.06823466718196869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,32,balanced,0.050661335388819374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,32,balanced,0.06819733480612437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,32,balanced,0.052895997961362205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,32,balanced,0.06869866450627644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,32,balanced,0.054645334680875145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,32,balanced,0.055439998706181846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,32,balanced,0.0689333329598109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,32,balanced,0.05632533133029938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,32,balanced,0.07036800185839336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,32,balanced,0.05619200070699056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,32,balanced,0.06974933544794719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,32,balanced,0.057034666339556374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,32,balanced,0.0684746652841568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,32,balanced,0.057914664347966514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,32,balanced,0.06945066650708516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,32,balanced,0.058378666639328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,32,balanced,0.059621334075927734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,32,balanced,0.07002666592597961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,32,balanced,0.06150400141874949
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,32,balanced,0.07009066641330719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,32,balanced,0.06676800052324931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,32,balanced,0.07406400144100189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,32,balanced,0.07150933146476746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,32,balanced,0.04051200052102407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,32,balanced,0.07318399846553802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,32,balanced,0.07416533430417378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,32,balanced,0.0848586658636729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,32,balanced,0.040922666589419045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,32,balanced,0.07352533439795177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,32,balanced,0.041189332803090416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,32,balanced,0.08966933687527974
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,32,balanced,0.08277333279450734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,32,balanced,0.04465066889921824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,32,balanced,0.11025066177050273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,32,balanced,0.04629333317279816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,32,balanced,0.08364799618721008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,32,balanced,0.047594666481018066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,32,balanced,0.12114666899045308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,32,balanced,0.04878933231035868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,32,balanced,0.0972160001595815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,32,balanced,0.04911466439565023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,32,balanced,0.15290133158365884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,32,balanced,0.04948266843954722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,32,balanced,0.10170666376749675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,32,balanced,0.0505920002857844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,32,balanced,0.18029866615931192
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,32,balanced,0.05129600067933401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,32,balanced,0.051701332132021584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,32,balanced,0.12236799796422322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,32,balanced,0.05409066875775655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,32,balanced,0.05401599903901418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,32,balanced,0.24463999271392822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,32,balanced,0.1388213336467743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,32,balanced,0.057631999254226685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,32,power_law_1.01,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,32,balanced,0.06178666651248932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,32,balanced,0.305786669254303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,32,balanced,0.1788853406906128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,32,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,32,power_law_1.01,0.053990399837493895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,32,balanced,0.06897599995136261
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,32,power_law_1.01,0.06362239718437195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,32,power_law_1.01,0.06479359865188598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,32,power_law_1.01,0.06750720143318176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,32,balanced,0.21904534101486206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,32,power_law_1.01,0.06786559820175171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,32,balanced,0.42417065302530926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,32,power_law_1.01,0.0680191993713379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,32,balanced,0.07493866483370464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,32,power_law_1.01,0.070796799659729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,32,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,32,power_law_1.01,0.07401599884033203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,32,balanced,0.0804746647675832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,32,power_law_1.01,0.070387202501297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,32,power_law_1.01,0.05234559774398804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,32,power_law_1.01,0.07143679857254029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,32,power_law_1.01,0.04932479858398438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,32,power_law_1.01,0.05026559829711914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,32,power_law_1.01,0.07082239985466003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,32,balanced,0.2927253246307373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,32,power_law_1.01,0.05159040093421936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,32,power_law_1.01,0.07817599773406983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,32,power_law_1.01,0.05317760109901428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,32,balanced,0.5505280097325643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,32,power_law_1.01,0.08654720187187195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,32,power_law_1.01,0.054073601961135864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,32,balanced,0.0983786682287852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,32,power_law_1.01,0.09544960260391236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,32,power_law_1.01,0.05565440058708191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,32,power_law_1.01,0.0803712010383606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,32,power_law_1.01,0.05606399774551392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,32,power_law_1.01,0.10576000213623046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,32,balanced,0.11117333173751831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,32,power_law_1.01,0.0566976010799408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,32,power_law_1.01,0.11173759698867798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,32,power_law_1.01,0.06097919940948486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,32,power_law_1.01,0.06287999749183655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,32,power_law_1.01,0.14220800399780273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,32,power_law_1.01,0.04663040041923523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,32,power_law_1.01,0.06444799900054932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,32,power_law_1.01,0.1463487982749939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,32,balanced,0.377130667368571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,32,power_law_1.01,0.06629120111465454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,32,power_law_1.01,0.045228800177574156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,32,power_law_1.01,0.18844159841537475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,32,power_law_1.01,0.07351679801940918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,32,balanced,0.1437173287073771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,32,power_law_1.01,0.04161919951438904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,32,power_law_1.01,0.07813760042190551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,32,power_law_1.01,0.22103679180145264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,32,power_law_1.01,0.04671359956264496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,32,power_law_1.01,0.0772159993648529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,32,power_law_1.01,0.3196415901184082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,32,balanced,0.6622506777445475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,32,power_law_1.01,0.09990400075912476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,32,power_law_1.01,0.04742400050163269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,32,balanced,0.1686346729596456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,32,power_law_1.01,0.37548160552978516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,32,power_law_1.01,0.10723199844360351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,32,power_law_1.01,0.04832000136375427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,32,power_law_1.01,0.13640960454940795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,32,power_law_1.01,0.04948480129241943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,32,power_law_1.01,0.4913343906402588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,32,power_law_1.01,0.14803199768066405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,32,power_law_1.01,0.051148802042007446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,32,power_law_1.01,0.19084160327911376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,32,power_law_1.01,0.7429376125335694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,32,power_law_1.01,0.05170559883117676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,32,power_law_1.01,0.22945280075073243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,32,power_law_1.01,0.054079997539520266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,32,power_law_1.01,0.9090751647949219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,32,power_law_1.01,0.34428160190582274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,32,power_law_1.01,0.05507199764251709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,32,power_law_1.01,0.42070398330688474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,32,balanced,0.4434293508529663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,32,balanced,0.22607467571894327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,32,power_law_1.01,1.2140095710754395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,32,power_law_1.01,0.058457601070404056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,32,power_law_1.01,0.5804736137390136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,32,power_law_1.2,0.0673088014125824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,32,power_law_1.01,0.06336640119552613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,32,power_law_1.01,0.8445568084716797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,32,power_law_1.01,2.4740928649902343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,32,power_law_1.01,0.06690559983253479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,32,power_law_1.2,0.05807999968528747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,32,power_law_1.01,0.9716863632202148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,32,power_law_1.01,0.07259520292282104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,32,power_law_1.2,0.05169919729232788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,32,power_law_1.01,1.598316764831543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,32,power_law_1.2,0.06227840185165405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,32,power_law_1.2,0.05920640230178833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,32,power_law_1.01,3.3648319244384766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,32,power_law_1.01,0.07258880138397217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,32,power_law_1.2,0.06466559767723083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,32,power_law_1.2,0.05161600112915039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,32,balanced,0.2964479923248291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,32,power_law_1.2,0.06755840182304382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,32,balanced,1.0326666831970215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,32,power_law_1.01,0.0790719985961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,32,power_law_1.2,0.047577598690986635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,32,power_law_1.2,0.06785280108451844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,32,power_law_1.2,0.052108800411224364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,32,power_law_1.2,0.06928640007972717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,32,power_law_1.2,0.05245440006256104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,32,power_law_1.2,0.07408000230789184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,32,power_law_1.01,0.09802240133285522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,32,power_law_1.2,0.055212801694869994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,32,power_law_1.2,0.07750399708747864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,32,power_law_1.01,0.11731200218200684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,32,balanced,0.4269706805547078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,32,power_law_1.2,0.07349119782447815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,32,power_law_1.2,0.05553920269012451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,32,balanced,0.6786879698435465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,32,power_law_1.2,0.07338240146636962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,32,power_law_1.2,0.057004797458648684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,32,power_law_1.01,0.14088959693908693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,32,power_law_1.2,0.07534080147743225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,32,power_law_1.2,0.060159999132156375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,32,power_law_1.01,0.17431679964065552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,32,power_law_1.2,0.08049920201301575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,32,power_law_1.2,0.059961599111557004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,32,power_law_1.2,0.06227840185165405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,32,power_law_1.2,0.09012479782104492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,32,power_law_1.01,0.2522111892700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,32,power_law_1.2,0.0669376015663147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,32,power_law_1.2,0.09945600032806397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,32,power_law_1.01,0.32907519340515134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,32,power_law_1.2,0.0705407977104187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,32,power_law_1.2,0.09082239866256714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,32,power_law_1.2,0.0726527988910675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,32,power_law_1.01,0.40102400779724123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,32,power_law_1.2,0.11048959493637085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,32,power_law_1.2,0.07706239819526672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,32,balanced,0.5625066757202148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,32,power_law_1.2,0.1296704053878784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,32,power_law_1.01,0.582144021987915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,32,power_law_1.2,0.08764799833297729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,32,power_law_1.2,0.1610751986503601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,32,power_law_1.2,0.0900223970413208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,32,power_law_1.01,0.8381952285766602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,32,power_law_1.2,0.17295360565185547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,32,power_law_1.2,0.10632319450378418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,32,power_law_1.2,0.23204479217529297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,32,power_law_1.01,1.2339648246765136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,32,power_law_1.2,0.11812479496002197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,32,power_law_1.2,0.26844799518585205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,32,power_law_1.2,0.15370880365371703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,32,power_law_1.01,1.4067008018493652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,32,power_law_1.2,0.36126720905303955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,32,power_law_1.2,0.49679999351501464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,32,power_law_1.2,0.16740479469299316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,32,power_law_1.01,2.219660758972168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,32,power_law_1.2,0.8361599922180176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,32,power_law_1.2,0.23873279094696045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,32,balanced,0.6853066285451254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,32,balanced,2.0389599800109863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,32,power_law_1.2,0.2923583984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,32,power_law_1.01,4.0897216796875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,32,power_law_1.2,0.9154623985290528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,32,power_law_1.2,0.4105088233947754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,32,power_law_1.2,1.2981120109558106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,32,power_law_1.2,0.5276735782623291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,32,power_law_1.2,2.167340850830078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,32,power_law_1.2,0.7864575862884522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,32,power_law_1.2,3.7929920196533202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,32,power_law_1.2,1.1690176010131836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,32,power_law_1.2,1.4584575653076173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,32,balanced,1.3241386413574219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,32,power_law_1.2,2.114771270751953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,32,power_law_1.2,5.25854721069336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,32,balanced,1.0639893213907878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,32,balanced,2.0984907150268555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,16,balanced,0.05130666494369507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,32,power_law_1.2,0.04650239944458008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,16,balanced,0.050954664746920265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,32,power_law_1.2,0.04387199878692627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,16,balanced,0.052111998200416565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,32,power_law_1.2,0.042745599150657655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,16,balanced,0.05499733487764994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,32,power_law_1.2,0.045311999320983884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,16,balanced,0.06448000172773997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,32,power_law_1.2,0.046828800439834596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,16,balanced,0.06897066533565521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,16,balanced,0.06866666674613953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,32,power_law_1.2,0.04801279902458191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,16,balanced,0.07117333511511485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,32,power_law_1.2,0.05030400156974792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,16,balanced,0.06966933111349742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,32,power_law_1.2,0.05112959742546082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,16,balanced,0.07127999762694041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,32,power_law_1.2,0.05422719717025757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,16,balanced,0.07201600074768066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,32,power_law_1.2,0.05607680082321167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,16,balanced,0.07274133463700612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,32,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,16,balanced,0.07240533332029979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,16,balanced,0.07520000139872234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,32,power_law_1.2,0.06026880145072937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,32,power_law_1.2,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,16,balanced,0.07947733501593272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,32,power_law_1.2,0.06853119730949402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,16,balanced,0.0788800021012624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,32,power_law_1.2,0.07427840232849121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,16,balanced,0.08186133205890656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,16,balanced,0.09850666920344035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,32,power_law_1.2,0.08556159734725952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,16,balanced,0.09103467067082723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,32,power_law_1.2,0.08803200125694274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,16,balanced,0.12055466572443645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,16,balanced,0.04535466432571411
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,16,balanced,0.11169600486755371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,32,power_law_1.2,0.10944000482559205
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,16,balanced,0.04651199777921041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,32,power_law_1.2,0.129094398021698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,16,balanced,0.04655999938646952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,16,balanced,0.15313599507013956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,16,balanced,0.05310399830341339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,16,balanced,0.054234668612480164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,16,balanced,0.0572266678015391
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,32,power_law_1.2,0.15132800340652466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,16,balanced,0.05793599784374237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,16,balanced,0.16486933827400208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,16,balanced,0.05872533222039541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,32,power_law_1.2,0.2234560012817383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,16,balanced,0.05949333310127258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,16,balanced,0.04093866546948751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,16,balanced,0.05955733358860016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,16,balanced,0.06101333101590475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,16,balanced,0.04189866781234741
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,32,power_law_1.2,0.2818432092666626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,16,power_law_1.01,0.07586560249328614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,16,balanced,0.06057066718737284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,16,balanced,0.04252799848715464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,16,balanced,0.2291839917500814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,32,power_law_1.2,0.4247744083404541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,16,balanced,0.0621013343334198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,16,balanced,0.04762133459250132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,16,power_law_1.01,0.06721280217170715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,16,balanced,0.06469866633415222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,16,balanced,0.0495413343111674
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,16,balanced,0.06761600077152252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,16,power_law_1.01,0.05196160078048706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,16,balanced,0.051856001218159996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,32,power_law_1.2,0.5339968204498291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,16,balanced,0.07217066486676534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,16,power_law_1.01,0.05798400044441223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,16,balanced,0.053413331508636475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,16,balanced,0.07611200213432312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,16,balanced,0.26713599761327106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,16,balanced,0.0537066658337911
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,16,power_law_1.01,0.06035199761390686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,16,balanced,0.09614400068918864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,32,power_law_1.2,0.768671989440918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,16,balanced,0.05418666700522105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,16,balanced,0.09411199887593587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,16,power_law_1.01,0.06480000019073487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,32,power_law_1.2,1.2606975555419921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,16,balanced,0.05494399865468343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,16,balanced,0.12156266967455547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,16,power_law_1.01,0.0664192020893097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,16,balanced,0.05735999842484792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,16,power_law_1.01,0.06993280053138733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,16,balanced,0.12691733241081238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,32,power_law_1.2,1.6571136474609376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,16,balanced,0.05707733333110809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,16,power_law_1.01,0.07028480172157288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,16,power_law_1.01,0.05859839916229248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,16,balanced,0.05922666688760122
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,32,power_law_1.2,1.8856447219848633
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,16,balanced,0.3857119878133138
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,16,balanced,0.17694934209187826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,16,power_law_1.01,0.07210239768028259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,16,power_law_1.01,0.05564799904823303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,16,balanced,0.06085866689682007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,16,power_law_1.01,0.07438079714775085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,32,power_law_1.2,3.47852783203125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,16,balanced,0.06484800080458324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,16,power_law_1.01,0.05129600167274475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,16,power_law_1.01,0.04785920083522797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,16,balanced,0.20096000035603842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,16,power_law_1.01,0.07778559923171997
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,16,power_law_1.01,0.05271040201187134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,16,power_law_1.01,0.0500927984714508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,32,power_law_1.2,8.343199920654296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,16,power_law_1.01,0.07592319846153259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,16,balanced,0.06936533252398173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,16,power_law_1.01,0.052960002422332765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,16,power_law_1.01,0.04579200148582459
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,16,power_law_1.01,0.07985280156135559
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,16,power_law_1.01,0.05663999915122986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,16,balanced,0.2760266661643982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,16,power_law_1.01,0.048256000876426695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,16,power_law_1.01,0.082777601480484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,16,balanced,0.07517333328723907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,16,power_law_1.01,0.05725439786911011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,16,power_law_1.01,0.04830079972743988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,16,balanced,0.4566613435745239
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,16,power_law_1.01,0.08952320218086243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,16,power_law_1.01,0.05792639851570129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,16,power_law_1.01,0.05308799743652344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,16,power_law_1.01,0.09434239864349366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,16,power_law_1.01,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,16,balanced,0.34327467282613117
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,16,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,16,power_law_1.01,0.1167296051979065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,16,power_law_1.01,0.060659199953079224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,16,power_law_1.01,0.05578879714012146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,16,balanced,0.0862506628036499
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,16,power_law_1.01,0.12951040267944336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,16,power_law_1.01,0.06455039978027344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,16,power_law_1.01,0.05759360194206238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,16,balanced,0.09733333190282185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,16,power_law_1.01,0.1511296033859253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,16,power_law_1.01,0.06549760103225707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,16,power_law_1.01,0.05963519811630249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,16,power_law_1.01,0.17620480060577393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,16,power_law_1.01,0.07144960165023803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,16,power_law_1.01,0.06202239990234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,16,balanced,0.49720001220703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,16,power_law_1.01,0.06709759831428527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,16,power_law_1.01,0.07008640170097351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,16,power_law_1.01,0.22101759910583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,16,balanced,0.5324906508127848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,16,power_law_1.01,0.06855040192604064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,16,power_law_1.01,0.23590400218963622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,16,power_law_1.01,0.07781760096549988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,16,balanced,0.11821333567301433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,16,power_law_1.01,0.07363200187683105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,16,power_law_1.01,0.08076800107955932
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,16,power_law_1.01,0.3270080089569092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,16,power_law_1.01,0.08279039859771728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,16,power_law_1.01,0.09040639996528625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,16,balanced,0.1347040037314097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,16,power_law_1.01,0.4129792213439941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,16,power_law_1.01,0.10673279762268066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,16,power_law_1.01,0.5949696063995361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,16,power_law_1.01,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,16,power_law_1.01,0.11937919855117798
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,16,balanced,0.6149013439814249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,16,power_law_1.01,0.7991744041442871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,16,power_law_1.01,0.14803839921951295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,16,power_law_1.01,0.09594240188598632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,16,balanced,0.18190399805704752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,16,power_law_1.01,0.9056575775146485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,16,power_law_1.01,0.16433279514312743
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,16,power_law_1.01,1.41014404296875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,16,power_law_1.01,0.21842560768127442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,16,balanced,0.22804266214370728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,16,power_law_1.01,0.11621760129928589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,16,power_law_1.01,0.24956800937652587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,16,power_law_1.01,2.904115104675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,16,power_law_1.01,0.1347264051437378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,16,power_law_1.2,0.07601280212402343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,16,power_law_1.01,0.35253760814666746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,16,power_law_1.2,0.06255360245704651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,16,power_law_1.01,0.4850304126739502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,16,balanced,0.8521173000335693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,16,power_law_1.2,0.051910400390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,16,power_law_1.01,0.15799039602279663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,16,power_law_1.01,0.6885056018829345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,16,balanced,0.7431306838989258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,16,power_law_1.2,0.057651197910308837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,16,power_law_1.01,0.20289919376373292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,16,balanced,0.3325066765149434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,16,power_law_1.01,0.8467840194702149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,16,power_law_1.2,0.061324799060821535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,16,power_law_1.01,1.1131711959838868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,16,power_law_1.01,0.27790720462799073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,16,power_law_1.2,0.06514559984207154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,16,power_law_1.01,0.3897919893264771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,16,power_law_1.01,1.6465471267700196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,16,power_law_1.2,0.0671231985092163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,16,balanced,0.42742399374643963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,16,power_law_1.2,0.06967679858207702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,16,power_law_1.01,3.2578880310058596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,16,power_law_1.01,0.5398335933685303
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,16,power_law_1.2,0.0699072003364563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,16,power_law_1.01,0.7780479907989502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,16,power_law_1.2,0.0714303970336914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,16,power_law_1.2,0.07383040189743043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,16,power_law_1.2,0.07681919932365418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,16,power_law_1.01,1.0733247756958009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,16,power_law_1.2,0.08013439774513245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,16,balanced,0.6127573251724243
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,16,power_law_1.01,1.2653696060180664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,16,power_law_1.2,0.07994880080223084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,16,balanced,1.17740797996521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,16,power_law_1.01,1.7932159423828125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,16,power_law_1.2,0.08568320274353028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,16,power_law_1.2,0.09253119826316833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,16,power_law_1.01,2.702764892578125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,16,power_law_1.2,0.09905279874801635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,16,power_law_1.2,0.12721920013427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,16,power_law_1.01,5.840633773803711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,16,balanced,0.7917333443959554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,16,power_law_1.2,0.1286784052848816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,16,power_law_1.2,0.16299519538879395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,16,power_law_1.2,0.17688319683074952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,16,power_law_1.2,0.259334397315979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,16,balanced,1.6144372622172039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,16,power_law_1.2,0.2771967887878418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,16,power_law_1.2,0.38679039478302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,16,power_law_1.2,0.5235519886016846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,16,balanced,0.9645813306172689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,16,power_law_1.2,0.6695807933807373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,16,power_law_1.2,0.9638912200927734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,16,power_law_1.2,1.3047231674194335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,16,power_law_1.2,1.9837055206298828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,16,power_law_1.2,3.9886913299560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,16,balanced,2.298389275868734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,16,balanced,1.5152907371520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,16,power_law_1.2,0.05896959900856018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,16,power_law_1.2,0.051718401908874514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,16,power_law_1.2,0.04750719964504242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,16,power_law_1.2,0.05372160077095032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,16,power_law_1.2,0.05255680084228516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,16,power_law_1.2,0.0564736008644104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,16,power_law_1.2,0.05746560096740723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,16,power_law_1.2,0.05849599838256836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,16,power_law_1.2,0.0598143994808197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,16,power_law_1.2,0.061638402938842776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,16,power_law_1.2,0.06417919993400574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,16,power_law_1.2,0.06814720034599304
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,16,power_law_1.2,0.07055360078811646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,16,power_law_1.2,0.06992639899253845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,16,power_law_1.2,0.07996799945831298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,16,power_law_1.2,0.08356480002403259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,16,power_law_1.2,0.0927295982837677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,16,power_law_1.2,0.11272959709167481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,16,balanced,2.9956534703572593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,16,power_law_1.2,0.1259392023086548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,16,power_law_1.2,0.16606080532073975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,16,power_law_1.2,0.1806399941444397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,16,power_law_1.2,0.23895039558410644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,16,power_law_1.2,0.2701184034347534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,16,power_law_1.2,0.40750718116760254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,16,power_law_1.2,0.5212031841278076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,16,power_law_1.2,0.7500031948089599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,16,power_law_1.2,1.0770815849304198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,16,power_law_1.2,1.2087295532226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,16,power_law_1.2,2.13767032623291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,16,power_law_1.2,5.3222911834716795
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,16,power_law_1.2,0.05139200091361999
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,16,power_law_1.2,0.045977601408958436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,16,power_law_1.2,0.04477440118789673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,8,balanced,0.05209066470464071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,16,power_law_1.2,0.047705599665641786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,8,balanced,0.05176533261934916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,16,power_law_1.2,0.049619200825691226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,8,balanced,0.05333333214124044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,8,balanced,0.057162667314211525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,16,power_law_1.2,0.05299199819564819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,8,balanced,0.06638933221499126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,16,power_law_1.2,0.05472000241279602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,8,balanced,0.07372266550858815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,16,power_law_1.2,0.056652802228927615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,8,balanced,0.046112000942230225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,8,balanced,0.07358933488527934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,16,power_law_1.2,0.058278399705886844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,8,balanced,0.04713066418965658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,8,balanced,0.07613866527875264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,8,balanced,0.04808000226815542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,16,power_law_1.2,0.060736000537872314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,8,balanced,0.07437333464622498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,8,balanced,0.05342400074005127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,8,balanced,0.07623999814192454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,16,power_law_1.2,0.063673597574234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,8,balanced,0.05845866600672404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,8,balanced,0.0749066670735677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,16,power_law_1.2,0.06818559765815735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,8,balanced,0.06163200239340464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,8,balanced,0.07622933387756348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,16,power_law_1.2,0.07061759829521179
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,8,balanced,0.06309333443641663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,8,balanced,0.07878399888674419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,16,power_law_1.2,0.0790719985961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,8,balanced,0.0634080022573471
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,8,balanced,0.07855999966462453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,16,power_law_1.2,0.08195199966430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,8,balanced,0.06294399996598561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,8,balanced,0.08271466692288716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,8,balanced,0.06534400085608165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,8,balanced,0.08741333087285359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,16,power_law_1.2,0.08935040235519409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,8,balanced,0.06484800080458324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,8,balanced,0.08878399928410848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,8,balanced,0.06588266789913177
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,8,balanced,0.1102133293946584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,16,power_law_1.2,0.10128639936447144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,8,balanced,0.06713066498438518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,8,balanced,0.10754666725794475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,8,balanced,0.07100800176461537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,8,balanced,0.07517866790294647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,16,power_law_1.2,0.12175999879837036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,8,balanced,0.1254026691118876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,8,balanced,0.08061866462230682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,16,power_law_1.2,0.14075520038604736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,8,balanced,0.13428266843159994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,8,balanced,0.08543466528256734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,8,balanced,0.10874666770299275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,16,power_law_1.2,0.21045761108398436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,8,balanced,0.21008533239364624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,8,balanced,0.11012267072995503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,16,power_law_1.2,0.23028481006622314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,8,balanced,0.13170133034388223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,8,balanced,0.2104640007019043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,8,power_law_1.01,0.05642240047454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,16,power_law_1.2,0.36576640605926514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,8,power_law_1.01,0.05041279792785645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,8,balanced,0.14826132853825888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,16,power_law_1.2,0.42554240226745604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,8,power_law_1.01,0.06507520079612732
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,8,power_law_1.01,0.05434880256652832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,8,power_law_1.01,0.053395199775695804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,8,balanced,0.30320000648498535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,16,power_law_1.2,0.6495232105255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,8,power_law_1.01,0.05800960063934326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,8,power_law_1.01,0.04836480021476745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,8,balanced,0.2160053253173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,8,power_law_1.01,0.0530239999294281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,16,power_law_1.2,0.9547007560729981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,8,power_law_1.01,0.06202239990234375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,8,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,8,power_law_1.01,0.07095680236816407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,8,balanced,0.24406933784484863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,16,power_law_1.2,1.43121280670166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,8,power_law_1.01,0.059910398721694944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,8,power_law_1.01,0.07289599776268005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,8,balanced,0.36554133892059326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,8,power_law_1.01,0.06053760051727295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,16,power_law_1.2,1.5866432189941406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,8,power_law_1.01,0.07136639952659607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,8,power_law_1.01,0.061868798732757566
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,8,balanced,0.34869333108266193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,8,power_law_1.01,0.07272959947586059
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,16,power_law_1.2,2.380780792236328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,8,power_law_1.01,0.0639743983745575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,8,power_law_1.01,0.07520639896392822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,8,power_law_1.01,0.06686720252037048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,16,power_law_1.2,3.5513790130615233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,8,power_law_1.01,0.06817280054092408
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,8,power_law_1.01,0.0790719985961914
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,8,balanced,0.49930667877197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,8,power_law_1.01,0.07187839746475219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,8,power_law_1.01,0.08056319952011108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,16,power_law_1.2,9.010399627685548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,8,balanced,0.43839999039967853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,8,power_law_1.01,0.07616639733314515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,8,power_law_1.01,0.08300160169601441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,8,power_law_1.01,0.07697920203208923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,8,power_law_1.01,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,8,power_law_1.01,0.0832319974899292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,8,power_law_1.01,0.09249920248985291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,8,power_law_1.01,0.08957440257072449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,8,power_law_1.01,0.09871360063552856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,8,power_law_1.01,0.10051840543746948
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,8,balanced,0.6217173337936401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,8,power_law_1.01,0.11741440296173096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,8,power_law_1.01,0.10165760517120362
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,8,balanced,0.6418613195419312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,8,power_law_1.01,0.12602239847183228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,8,power_law_1.01,0.12328319549560547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,8,power_law_1.01,0.15211520195007325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,8,power_law_1.01,0.1255295991897583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,8,power_law_1.01,0.18944640159606935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,8,power_law_1.01,0.1476863980293274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,8,power_law_1.01,0.20067200660705567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,8,power_law_1.01,0.2390144109725952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,8,power_law_1.01,0.2625983953475952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,8,power_law_1.01,0.29109759330749513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,8,balanced,0.7925439675649008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,8,power_law_1.01,0.28495359420776367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,8,power_law_1.01,0.4097792148590088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,8,power_law_1.01,0.4892672061920166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,8,power_law_1.01,0.37189760208129885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,8,balanced,0.758016029993693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,8,power_law_1.01,0.7553664207458496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,8,power_law_1.01,0.48148479461669924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,8,power_law_1.01,1.0603008270263672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,8,power_law_1.01,0.7014272212982178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,8,power_law_1.01,1.2863743782043457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,8,power_law_1.01,0.8993984222412109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,8,power_law_1.01,2.0005632400512696
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,8,power_law_1.01,1.0701760292053222
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,8,power_law_1.01,1.7700288772583008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,8,power_law_1.01,4.246316909790039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,8,balanced,0.9603573481241862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,8,power_law_1.01,3.501094436645508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,8,balanced,1.1808213392893474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,8,power_law_1.2,0.05726720094680786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,8,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,8,power_law_1.2,0.05280640125274658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,8,power_law_1.2,0.059648001194000246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,8,power_law_1.2,0.06396160125732422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,8,power_law_1.2,0.06922879815101624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,8,balanced,1.4842400550842285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,8,power_law_1.2,0.07338240146636962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,8,power_law_1.2,0.07397119998931885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,8,power_law_1.2,0.0720575988292694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,8,power_law_1.2,0.07797759771347046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,8,power_law_1.2,0.07753599882125854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,8,power_law_1.2,0.08210560083389282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,8,power_law_1.2,0.08542720079421998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,8,power_law_1.2,0.08982399702072144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,8,power_law_1.2,0.09603840112686157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,8,power_law_1.2,0.09998720288276672
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,8,power_law_1.2,0.10808320045471191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,8,power_law_1.2,0.12934399843215943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,8,power_law_1.2,0.12991360425949097
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,8,power_law_1.2,0.1545024037361145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,8,power_law_1.2,0.2106112003326416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,8,power_law_1.2,0.25090560913085935
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,8,power_law_1.2,0.2773119926452637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,8,power_law_1.2,0.4446720123291016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,8,power_law_1.2,0.5825535774230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,8,power_law_1.2,0.8041664123535156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,8,power_law_1.2,1.0697088241577148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,8,power_law_1.2,1.2846336364746094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,8,power_law_1.2,2.074720001220703
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,8,balanced,2.2808052698771157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,8,power_law_1.2,5.210867309570313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,8,balanced,2.9406986236572266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,8,power_law_1.2,0.04991360008716583
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,8,power_law_1.2,0.04891520142555237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,8,power_law_1.2,0.0483711987733841
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,8,power_law_1.2,0.051769602298736575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,8,power_law_1.2,0.053472000360488894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,8,power_law_1.2,0.059436798095703125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,8,power_law_1.2,0.06107519865036011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,8,power_law_1.2,0.062067198753356936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,8,power_law_1.2,0.06464639902114869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,8,power_law_1.2,0.06546559929847717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,8,power_law_1.2,0.07069439888000488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,8,power_law_1.2,0.07216640114784241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,8,power_law_1.2,0.07742720246315002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,8,power_law_1.2,0.07795199751853943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,8,power_law_1.2,0.08402559757232667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,8,power_law_1.2,0.09159039855003356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,8,power_law_1.2,0.10238720178604126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,8,power_law_1.2,0.11905920505523682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,8,power_law_1.2,0.1270848035812378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,8,power_law_1.2,0.1731328010559082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,8,power_law_1.2,0.19685759544372558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,8,power_law_1.2,0.25960960388183596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,8,power_law_1.2,0.31032960414886473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,8,power_law_1.2,0.4725632190704346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,128,balanced,0.11293866237004598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,8,power_law_1.2,0.6211711883544921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,128,balanced,0.11161599556605022
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,8,power_law_1.2,0.8401344299316407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,128,balanced,0.11500799655914307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,128,balanced,0.11760000387827556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,8,power_law_1.2,1.0903743743896483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,128,balanced,0.11852799852689107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,8,power_law_1.2,1.4217599868774413
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,128,balanced,0.20086934169133505
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,128,balanced,0.28359999259312946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,8,power_law_1.2,2.5530111312866213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,128,balanced,0.2812959949175517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,128,balanced,0.07690666615962982
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,128,balanced,0.28567999601364136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,128,balanced,0.0787360022465388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,8,power_law_1.2,5.326540756225586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,128,balanced,0.08004799981911977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,128,balanced,0.28723732630411786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,128,balanced,0.08117866516113281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,128,balanced,0.2879679997762044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,128,balanced,0.07960000137488048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,128,balanced,0.12436266740163167
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,128,balanced,0.2905866702397664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,128,balanced,0.16668800512949625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,128,balanced,0.17385067542394003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,128,balanced,0.2834879954655965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,128,balanced,0.1779786745707194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,128,balanced,0.30055999755859375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,128,balanced,0.17439999183019003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,128,balanced,0.183296004931132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,128,balanced,0.2840320070584615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,128,balanced,0.17361599206924438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,128,balanced,0.2804960012435913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,128,balanced,0.17271467049916586
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,128,balanced,0.1829920013745626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,128,balanced,0.2914560039838155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,128,balanced,0.18266665935516357
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,128,balanced,0.18729066848754883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,128,balanced,0.2974986632664998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,128,balanced,0.18914665778477988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,128,balanced,0.29809067646662396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,128,balanced,0.04457599918047587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,128,balanced,0.19194666544596353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,128,balanced,0.2978293299674988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,128,balanced,0.04539200166861216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,128,balanced,0.20038400093714395
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,128,balanced,0.04520533482233683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,128,balanced,0.22532800833384195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,128,balanced,0.3128053347269694
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,128,balanced,0.04789333542188009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,128,balanced,0.04811733464399973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,128,balanced,0.24621333678563437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,128,balanced,0.05487466851870219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,128,balanced,0.31918400526046753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,128,balanced,0.06333866715431213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,128,balanced,0.27271467447280884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,128,balanced,0.06380266447861989
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,128,balanced,0.06439466774463654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,128,balanced,0.06434133152167003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,128,balanced,0.3119306763013204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,128,balanced,0.3035893241564433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,128,balanced,0.06622399886449178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,128,balanced,0.06657599906126659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,128,balanced,0.06830400228500366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,128,balanced,0.06913599868615468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,128,balanced,0.305893341700236
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,128,balanced,0.35542933146158856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,128,balanced,0.0745119998852412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,128,balanced,0.07520533104737599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,128,balanced,0.07969066500663757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,128,balanced,0.5415680011113485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,128,balanced,0.5692160129547119
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,128,balanced,0.08830400307973225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,128,power_law_1.01,0.1716096043586731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,128,balanced,0.0992746651172638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,128,power_law_1.01,0.276908802986145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,128,power_law_1.01,0.1739967942237854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,128,power_law_1.01,0.2807807922363281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,128,balanced,0.6519680023193359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,128,power_law_1.01,0.16707199811935425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,128,balanced,0.5562666654586792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,128,power_law_1.01,0.287987208366394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,128,power_law_1.01,0.1257599949836731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,128,power_law_1.01,0.19388799667358397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,128,power_law_1.01,0.14767359495162963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,128,balanced,0.11639466881752014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,128,power_law_1.01,0.21489279270172118
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,128,power_law_1.01,0.15199359655380248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,128,power_law_1.01,0.15576319694519042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,128,power_law_1.01,0.27268478870391843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,128,balanced,0.13124799728393555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,128,power_law_1.01,0.26874239444732667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,128,power_law_1.01,0.1565440058708191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,128,balanced,0.8962559700012207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,128,power_law_1.01,0.17898240089416503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,128,power_law_1.01,0.22771201133728028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,128,power_law_1.01,0.05867519974708557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,128,balanced,0.16214399536450705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,128,balanced,0.8259413242340088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,128,power_law_1.01,0.17269760370254517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,128,power_law_1.01,0.27546238899230957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,128,power_law_1.01,0.056601601839065555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,128,power_law_1.01,0.15123200416564941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,128,power_law_1.01,0.28117759227752687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,128,power_law_1.01,0.05539199709892273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,128,power_law_1.01,0.17003519535064698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,128,power_law_1.01,0.27922561168670657
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,128,power_law_1.01,0.055174398422241214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,128,power_law_1.01,0.17061760425567626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,128,power_law_1.01,0.2624255895614624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,128,power_law_1.01,0.05717759728431702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,128,power_law_1.01,0.17122559547424315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,128,power_law_1.01,0.27390079498291015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,128,power_law_1.01,0.06072319746017456
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,128,balanced,0.1962133248647054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,128,power_law_1.01,0.15267200469970704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,128,power_law_1.01,0.2726464033126831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,128,balanced,1.1354026794433594
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,128,power_law_1.01,0.05649920105934143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,128,power_law_1.01,0.1711743950843811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,128,power_law_1.01,0.2565567970275879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,128,power_law_1.01,0.06350719928741455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,128,balanced,1.0900906721750896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,128,power_law_1.01,0.1627135992050171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,128,power_law_1.01,0.2787584066390991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,128,balanced,0.25412267446517944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,128,power_law_1.01,0.06312320232391358
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,128,power_law_1.01,0.17276159524917603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,128,power_law_1.01,0.24471681118011473
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,128,power_law_1.01,0.061791998147964475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,128,power_law_1.01,0.18772480487823487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,128,power_law_1.01,0.2499840021133423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,128,power_law_1.01,0.061363202333450315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,128,power_law_1.01,0.24138240814208983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,128,power_law_1.01,0.25352959632873534
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,128,power_law_1.01,0.06669440269470214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,128,power_law_1.01,0.28120319843292235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,128,power_law_1.01,0.35148799419403076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,128,power_law_1.01,0.06785280108451844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,128,power_law_1.01,0.3387840032577515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,128,power_law_1.01,0.35905280113220217
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,128,power_law_1.01,0.072326397895813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,128,power_law_1.01,0.4341695785522461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,128,power_law_1.01,0.4879936218261719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,128,power_law_1.01,0.07861760258674622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,128,power_law_1.01,0.6260543823242187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,128,power_law_1.01,0.5875072002410888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,128,power_law_1.01,0.08461440205574036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,128,balanced,0.32579199473063153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,128,power_law_1.01,0.8269439697265625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,128,power_law_1.01,0.09510400295257568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,128,power_law_1.01,0.844217586517334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,128,balanced,1.7380693753560383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,128,power_law_1.01,1.1683008193969726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,128,power_law_1.01,0.10875519514083862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,128,power_law_1.01,1.0514944076538086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,128,power_law_1.01,1.5347519874572755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,128,balanced,1.6125866572062175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,128,power_law_1.2,0.2776832103729248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,128,power_law_1.01,1.6317056655883788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,128,power_law_1.01,0.1372480034828186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,128,power_law_1.01,2.0050432205200197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,128,power_law_1.2,0.2785599946975708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,128,power_law_1.01,1.9718208312988281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,128,balanced,0.44627734025319415
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,128,power_law_1.2,0.2478208065032959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,128,power_law_1.01,3.0496448516845702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,128,power_law_1.01,2.4941312789916994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,128,power_law_1.01,0.1588863968849182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,128,power_law_1.2,0.19411840438842773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,128,power_law_1.01,0.18827519416809083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,128,power_law_1.01,3.9707775115966797
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,128,power_law_1.2,0.21778559684753418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,128,power_law_1.01,6.514335632324219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,128,power_law_1.01,0.24490880966186523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,128,power_law_1.2,0.2517568111419678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,128,power_law_1.01,8.069158172607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,128,power_law_1.2,0.25333120822906496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,128,power_law_1.01,0.3082240104675293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,128,power_law_1.2,0.24371840953826904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,128,power_law_1.2,0.28387200832366943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,128,power_law_1.01,0.4295807838439941
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,128,power_law_1.2,0.250547194480896
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,128,balanced,0.5864266554514567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,128,power_law_1.2,0.2816384077072144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,128,power_law_1.01,0.5302656173706055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,128,power_law_1.2,0.24910080432891846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,128,power_law_1.01,0.844320011138916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,128,power_law_1.2,0.26538240909576416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,128,power_law_1.2,0.2572736024856567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,128,power_law_1.01,1.0172608375549317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,128,power_law_1.2,0.17106560468673707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,128,power_law_1.2,0.2707135915756226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,128,power_law_1.01,1.199673557281494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,128,power_law_1.2,0.17233279943466187
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,128,power_law_1.2,0.23340799808502197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,128,power_law_1.2,0.15882240533828734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,128,power_law_1.01,2.1192447662353517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,128,balanced,0.72270401318868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,128,power_law_1.2,0.11907839775085449
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,128,power_law_1.2,0.24068479537963866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,128,power_law_1.01,4.092454528808593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,128,power_law_1.2,0.13162879943847655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,128,power_law_1.2,0.2705535888671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,128,balanced,3.330992062886556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,128,power_law_1.2,0.15283199548721313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,128,power_law_1.2,0.3148672103881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,128,power_law_1.2,0.3724544048309326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,128,power_law_1.2,0.14991999864578248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,128,balanced,2.9533653259277344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,128,power_law_1.2,0.46647038459777834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,128,power_law_1.2,0.16042879819869996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,128,power_law_1.2,0.5964159965515137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,128,power_law_1.2,0.17382400035858153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,128,power_law_1.2,0.7462592124938965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,128,power_law_1.2,0.16432000398635865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,128,power_law_1.2,1.0922112464904785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,128,power_law_1.2,0.16486400365829468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,128,power_law_1.2,1.3367487907409668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,128,power_law_1.2,0.1605568051338196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,128,power_law_1.2,1.9506752014160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,128,balanced,1.1292373339335124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,128,power_law_1.2,0.16428159475326537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,128,power_law_1.2,2.7893440246582033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,128,power_law_1.2,0.1708672046661377
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,128,power_law_1.2,0.1686784029006958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,128,power_law_1.2,3.9992385864257813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,128,power_law_1.2,0.1635200023651123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,128,power_law_1.2,6.621279907226563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,128,power_law_1.2,0.15697920322418213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,128,power_law_1.2,0.1928063988685608
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,128,power_law_1.2,13.265113830566406
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,128,power_law_1.2,0.1985152006149292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,128,power_law_1.2,0.2868544101715088
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,128,power_law_1.2,0.30352001190185546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,128,power_law_1.2,0.4374591827392578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,128,power_law_1.2,0.5621952056884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,128,power_law_1.2,0.78023681640625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,128,power_law_1.2,0.9825728416442872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,128,power_law_1.2,1.4346495628356934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,128,power_law_1.2,1.9484159469604492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,128,power_law_1.2,2.515635108947754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,128,power_law_1.2,4.2293952941894535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,128,balanced,2.230405330657959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,128,power_law_1.2,9.869452667236327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,64,balanced,0.09518399834632874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,64,balanced,0.0930560032526652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,64,balanced,0.09698667128880818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,128,power_law_1.2,0.05878400206565857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,64,balanced,0.09872532884279887
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,64,balanced,0.12218667070070903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,128,power_law_1.2,0.05626239776611328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,64,balanced,0.18970666329065958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,128,power_law_1.2,0.05448960065841675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,64,balanced,0.2899786631266276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,128,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,64,balanced,0.2727359930674235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,128,power_law_1.2,0.058329600095748904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,64,balanced,0.28539733091990155
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,64,balanced,0.2975306709607442
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,128,power_law_1.2,0.059654402732849124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,64,balanced,0.28334933519363403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,128,power_law_1.2,0.05729280114173889
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,64,balanced,0.2699306607246399
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,128,power_law_1.2,0.06334720253944397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,64,balanced,0.064751997590065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,64,balanced,0.3113600015640259
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,128,power_law_1.2,0.06024320125579834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,64,balanced,0.06489066779613495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,64,balanced,0.28490134080251056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,128,power_law_1.2,0.06439679861068726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,64,balanced,0.06470933556556702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,64,balanced,0.2794506748517354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,64,balanced,0.06763199965159099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,128,power_law_1.2,0.06510720252990723
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,64,balanced,0.08390399813652039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,64,balanced,0.2948053280512492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,128,power_law_1.2,0.06720640063285828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,64,balanced,0.12931733330090842
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,64,balanced,0.2775680025418599
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,64,balanced,0.17137600978215536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,128,power_law_1.2,0.06931840181350708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,64,balanced,0.17634665966033936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,64,balanced,0.29064534107844037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,128,power_law_1.2,0.07089279890060425
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,64,balanced,0.1760586698849996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,64,power_law_1.01,0.28041601181030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,64,balanced,0.2866453329722087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,64,balanced,0.17734932899475098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,128,power_law_1.2,0.07906559705734253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,64,power_law_1.01,0.2818943977355957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,64,balanced,0.17919466892878214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,128,power_law_1.2,0.09253759980201721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,64,balanced,0.043824002146720886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,64,balanced,0.30370134115219116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,64,balanced,0.15954666336377463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,64,power_law_1.01,0.2823424100875854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,128,power_law_1.2,0.09708160161972046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,64,balanced,0.04466133316357931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,64,balanced,0.1851573387781779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,64,power_law_1.01,0.1472383975982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,64,balanced,0.29546666145324707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,64,balanced,0.044735997915267944
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,128,power_law_1.2,0.11859840154647827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,64,balanced,0.17038400967915854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,64,power_law_1.01,0.1950144052505493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,64,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,64,balanced,0.19008000691731772
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,64,power_law_1.01,0.24851839542388915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,64,balanced,0.048437332113583885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,64,balanced,0.3117813269297282
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,128,power_law_1.2,0.1350335955619812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,64,balanced,0.18874667088190714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,64,power_law_1.01,0.21190400123596193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,64,balanced,0.05499200026194254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,64,balanced,0.1897760033607483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,64,power_law_1.01,0.2503423929214478
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,64,balanced,0.0634986658891042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,64,balanced,0.2002613345781962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,64,balanced,0.3151893417040507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,128,power_law_1.2,0.17408640384674073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,64,balanced,0.06450133522351582
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,64,power_law_1.01,0.2647167921066284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,64,balanced,0.20570667584737143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,64,balanced,0.06442666550477345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,64,power_law_1.01,0.2596415996551514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,128,power_law_1.2,0.205401611328125
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,64,balanced,0.0651093324025472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,64,balanced,0.22086399793624878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,64,power_law_1.01,0.2752320051193237
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,128,power_law_1.2,0.3034303903579712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,64,balanced,0.0662613312403361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,64,balanced,0.3209386666615804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,64,power_law_1.01,0.2527231931686401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,64,balanced,0.24241065979003906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,64,balanced,0.06804266571998596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,64,power_law_1.01,0.2726912021636963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,64,power_law_1.01,0.17179520130157472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,64,balanced,0.06922133266925812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,128,power_law_1.2,0.4002367973327637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,64,power_law_1.01,0.262009596824646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,64,balanced,0.27482134103775024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,64,balanced,0.06962133447329204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,128,power_law_1.2,0.5253824234008789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,64,power_law_1.01,0.1631999969482422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,64,power_law_1.01,0.25864319801330565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,64,balanced,0.61407999197642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,64,balanced,0.07600000003973643
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,64,power_law_1.01,0.18067840337753296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,64,power_law_1.01,0.2758336067199707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,64,balanced,0.07638933261235555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,64,balanced,0.30346133311589557
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,64,power_law_1.01,0.2599168062210083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,64,power_law_1.01,0.10065920352935791
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,128,power_law_1.2,0.6354559898376465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,64,balanced,0.0810346653064092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,64,power_law_1.01,0.25917439460754393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,64,power_law_1.01,0.13349119424819947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,128,power_law_1.2,1.0515199661254884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,64,balanced,0.09027733405431111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,64,power_law_1.01,0.26835200786590574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,64,balanced,0.3681600093841553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,64,power_law_1.01,0.133951997756958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,64,power_law_1.01,0.34163200855255127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,64,power_law_1.01,0.14562560319900514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,64,balanced,0.5842080116271973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,128,power_law_1.2,1.3835071563720702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,64,power_law_1.01,0.3740288019180298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,64,balanced,0.09961066643397014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,64,power_law_1.01,0.1583359956741333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,128,power_law_1.2,1.8301759719848634
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,64,power_law_1.01,0.4785855770111084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,64,power_law_1.01,0.16397440433502197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,64,balanced,0.5646773179372152
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,64,power_law_1.01,0.5812416076660156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,128,power_law_1.2,3.2759361267089844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,64,power_law_1.01,0.15674240589141847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,64,power_law_1.01,0.7898880004882812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,64,power_law_1.01,0.16822400093078613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,128,power_law_1.2,5.520479965209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,64,power_law_1.01,0.8857983589172364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,64,power_law_1.01,0.14640640020370482
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,64,balanced,0.12052800258000691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,64,power_law_1.01,1.3254207611083983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,64,power_law_1.01,0.1820799946784973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,64,balanced,0.8644266923268636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,64,power_law_1.01,0.062457597255706786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,64,balanced,0.13781866431236267
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,64,balanced,0.6790880362192789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,64,power_law_1.01,1.7316160202026367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,64,power_law_1.01,0.16636799573898314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,64,power_law_1.01,0.058899199962615965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,64,power_law_1.01,2.0800960540771483
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,64,power_law_1.01,0.16813440322875978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,64,power_law_1.01,0.05763840079307556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,64,balanced,0.16894400119781494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,64,power_law_1.01,0.05220479965209961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,64,power_law_1.01,0.17485439777374268
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,64,power_law_1.01,3.202323150634766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,64,power_law_1.01,0.054655998945236206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,64,power_law_1.01,0.16919039487838744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,64,power_law_1.01,0.056806397438049314
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,64,power_law_1.2,0.2772608041763306
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,64,power_law_1.01,7.778150177001953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,64,power_law_1.01,0.0597760021686554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,64,power_law_1.01,0.18744319677352905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,64,power_law_1.01,0.06257280111312866
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,64,power_law_1.2,0.2768383979797363
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,64,power_law_1.01,0.19853440523147584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,64,balanced,0.9270559946695963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,64,power_law_1.01,0.0652288019657135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,64,power_law_1.2,0.27444479465484617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,64,power_law_1.01,0.06453120112419128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,64,power_law_1.01,0.2529151916503906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,64,balanced,1.184869368871053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,64,balanced,0.20758932828903198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,64,power_law_1.01,0.06386560201644897
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,64,power_law_1.2,0.13519359827041627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,64,power_law_1.01,0.2871936082839966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,64,power_law_1.01,0.06908800005912781
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,64,power_law_1.2,0.20367999076843263
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,64,power_law_1.01,0.07035520076751708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,64,power_law_1.01,0.36551039218902587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,64,power_law_1.2,0.1752128005027771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,64,power_law_1.01,0.07279999852180481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,64,balanced,0.268778661886851
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,64,power_law_1.01,0.4439743995666504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,64,power_law_1.01,0.07924479842185975
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,64,power_law_1.2,0.21916799545288085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,64,power_law_1.01,0.08290560245513916
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,64,power_law_1.01,0.6227071762084961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,64,power_law_1.2,0.25201280117034913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,64,power_law_1.01,0.0886784017086029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,64,power_law_1.2,0.2465536117553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,64,power_law_1.01,0.7594880104064942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,64,power_law_1.01,0.11219199895858764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,64,balanced,1.2098399798075359
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,64,power_law_1.2,0.2640320062637329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,64,power_law_1.01,1.0517696380615233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,64,power_law_1.01,0.12617599964141846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,64,power_law_1.2,0.23322880268096924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,64,power_law_1.01,1.38722562789917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,64,balanced,0.3474080165227254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,64,power_law_1.2,0.25859200954437256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,64,power_law_1.01,0.15404160022735597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,64,power_law_1.01,1.944646453857422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,64,power_law_1.2,0.2619712114334106
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,64,power_law_1.01,0.18404480218887329
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,64,power_law_1.01,2.8334272384643553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,64,power_law_1.01,0.2464128017425537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,64,power_law_1.2,0.21928319931030274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,64,balanced,1.7231680552164714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,64,power_law_1.2,0.2510848045349121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,64,power_law_1.01,5.8631233215332035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,64,power_law_1.2,0.24773120880126953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,64,power_law_1.01,0.2870847940444946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,64,balanced,0.4833120107650757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,64,power_law_1.01,0.41455998420715334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,64,power_law_1.2,0.23361918926239014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,64,power_law_1.2,0.2781183958053589
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,64,power_law_1.01,0.5766911983489991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,64,power_law_1.2,0.31402881145477296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,64,power_law_1.01,0.8284928321838378
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,64,balanced,1.823520024617513
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,64,power_law_1.2,0.35859200954437254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,64,power_law_1.2,0.4291391849517822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,64,power_law_1.01,1.1422080039978026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,64,power_law_1.2,0.5283455848693848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,64,balanced,0.6500746806462606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,64,power_law_1.2,0.7256639957427978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,64,power_law_1.01,1.3944128036499024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,64,power_law_1.2,0.9617792129516601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,64,power_law_1.2,1.3035008430480957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,64,power_law_1.01,1.9560319900512695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,64,power_law_1.2,1.6489984512329101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,64,power_law_1.01,4.045292663574219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,64,power_law_1.2,2.3546688079833986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,64,power_law_1.2,3.1819839477539062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,64,power_law_1.2,4.225088119506836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,64,balanced,0.8087093035380045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,64,power_law_1.2,9.435616302490235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,64,balanced,3.1119521458943686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,64,balanced,3.457866668701172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,64,balanced,1.2667786280314128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,64,power_law_1.2,0.1769600033760071
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,64,power_law_1.2,0.16745599508285522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,64,power_law_1.2,0.16328959465026854
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,64,balanced,2.472218672434489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,64,power_law_1.2,0.11338880062103271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,64,power_law_1.2,0.10447360277175903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,64,power_law_1.2,0.11776000261306763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,64,power_law_1.2,0.12087680101394653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,64,power_law_1.2,0.1590399980545044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,64,power_law_1.2,0.12688640356063843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,64,power_law_1.2,0.0627839982509613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,64,power_law_1.2,0.1534656047821045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,64,power_law_1.2,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,64,power_law_1.2,0.1649791955947876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,64,power_law_1.2,0.055641597509384154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,64,power_law_1.2,0.15735679864883423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,64,power_law_1.2,0.05294079780578613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,64,power_law_1.2,0.17033599615097045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,64,power_law_1.2,0.05451520085334778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,64,power_law_1.2,0.16019200086593627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,64,power_law_1.2,0.058361601829528806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,64,power_law_1.2,0.17107199430465697
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,64,power_law_1.2,0.061273598670959474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,64,power_law_1.2,0.17807359695434571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,64,power_law_1.2,0.1842687964439392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,64,power_law_1.2,0.06350719928741455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,32,balanced,0.06432533264160156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,64,power_law_1.2,0.06260480284690857
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,64,power_law_1.2,0.19169919490814208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,32,balanced,0.06443200012048085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,64,power_law_1.2,0.06362879872322083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,64,power_law_1.2,0.20798079967498778
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,32,balanced,0.064410666624705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,64,power_law_1.2,0.06616320013999939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,64,power_law_1.2,0.2689471960067749
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,32,balanced,0.09742400050163269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,64,power_law_1.2,0.06731520295143127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,32,balanced,0.11887466907501221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,64,power_law_1.2,0.30190720558166506
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,32,balanced,0.20149866739908853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,64,power_law_1.2,0.070278400182724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,64,power_law_1.2,0.42595839500427246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,32,balanced,0.29810667037963867
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,64,power_law_1.2,0.07338240146636962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,64,power_law_1.2,0.5078527927398682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,32,balanced,0.2842400074005127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,64,power_law_1.2,0.08239359855651855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,32,balanced,0.264629324277242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,64,power_law_1.2,0.6521920204162598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,64,power_law_1.2,0.08494719862937927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,32,balanced,0.2925279935201009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,64,power_law_1.2,0.841062355041504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,32,balanced,0.2925493319829305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,64,power_law_1.2,0.09354879856109619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,32,balanced,0.29174933830897015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,64,power_law_1.2,1.272383975982666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,64,power_law_1.2,0.11893119812011718
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,32,balanced,0.28844799598058063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,64,power_law_1.2,1.6557439804077148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,32,balanced,0.28012800216674805
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,32,balanced,0.05834133426348368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,64,power_law_1.2,0.13934719562530518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,32,balanced,0.27236799399058026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,32,balanced,0.059418668349583946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,64,power_law_1.2,2.1123584747314452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,32,balanced,0.05952000121275584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,32,balanced,0.2821013331413269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,32,balanced,0.07027199864387512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,64,power_law_1.2,3.47509765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,32,balanced,0.2775946656862895
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,32,balanced,0.08284266789754231
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,64,power_law_1.2,0.17488640546798706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,32,balanced,0.13486933708190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,32,balanced,0.2913706700007121
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,32,balanced,0.17804799477259317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,64,power_law_1.2,0.20547199249267578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,64,power_law_1.2,7.050342559814453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,32,balanced,0.179584006468455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,32,balanced,0.28037865956624347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,32,balanced,0.18242132663726807
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,64,power_law_1.2,0.2786880016326904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,32,balanced,0.17918932437896729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,32,balanced,0.3056959907213847
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,32,balanced,0.18069867293039957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,32,balanced,0.1925706664721171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,32,balanced,0.18345065911610922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,32,balanced,0.30607465902964276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,64,power_law_1.2,0.3794559955596924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,32,balanced,0.18197333812713623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,64,power_law_1.2,0.5595967769622803
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,32,balanced,0.18949333826700845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,32,balanced,0.31709333260854083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,32,balanced,0.18586132923762003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,32,balanced,0.19638399283091226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,64,power_law_1.2,0.6246719837188721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,32,balanced,0.19885865847269693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,32,balanced,0.32570133606592816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,32,balanced,0.20880534251530966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,64,power_law_1.2,1.0409279823303224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,32,balanced,0.04472533365090688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,32,balanced,0.22894400358200073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,32,balanced,0.04523199796676636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,64,power_law_1.2,1.330675220489502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,32,balanced,0.24730666478474936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,32,balanced,0.34671998023986816
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,32,power_law_1.01,0.2052608013153076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,32,power_law_1.01,0.13544319868087767
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,32,balanced,0.04516266783078512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,32,balanced,0.04930133124192556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,32,balanced,0.2871413429578145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,32,power_law_1.01,0.29015679359436036
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,32,power_law_1.01,0.18367999792099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,64,power_law_1.2,1.7205312728881836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,32,balanced,0.051407997806866966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,32,power_law_1.01,0.301580810546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,32,power_law_1.01,0.18655359745025635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,64,power_law_1.2,3.01779842376709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,32,balanced,0.06053866446018219
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,32,balanced,0.3248800039291382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,32,power_law_1.01,0.11406079530715943
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,32,power_law_1.01,0.08549119830131531
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,32,balanced,0.6142079830169678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,32,balanced,0.06755200028419495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,32,power_law_1.01,0.16826239824295045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,32,power_law_1.01,0.11128319501876831
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,32,balanced,0.06955199937025706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,64,power_law_1.2,5.9413505554199215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,32,power_law_1.01,0.2205120086669922
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,32,balanced,0.06974933544794719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,32,balanced,0.39630401134490967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,32,power_law_1.01,0.13717759847640992
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,32,balanced,0.07007466753323872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,32,power_law_1.01,0.19799040555953978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,32,power_law_1.01,0.13025920391082763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,32,balanced,0.0716480016708374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,32,power_law_1.01,0.23804159164428712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,32,power_law_1.01,0.15362559556961058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,32,balanced,0.07292266686757405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,32,balanced,0.6336426734924316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,32,power_law_1.01,0.23069438934326172
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,32,balanced,0.5963253180185953
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,32,balanced,0.07442666590213776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,32,power_law_1.01,0.15221760272979737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,32,power_law_1.01,0.25684480667114257
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,32,balanced,0.075573335091273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,32,power_law_1.01,0.17020800113677978
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,32,power_law_1.01,0.2543872117996216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,32,balanced,0.08212266862392426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,32,power_law_1.01,0.16139520406723024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,32,power_law_1.01,0.26067841053009033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,32,balanced,0.08318933347860973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,32,power_law_1.01,0.1708032011985779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,32,power_law_1.01,0.2538367986679077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,32,balanced,0.08769067128499348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,32,balanced,0.7299626668294271
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,32,power_law_1.01,0.1656000018119812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,32,power_law_1.01,0.25939838886260985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,32,balanced,0.09897067149480183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,32,balanced,0.9335253238677979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,32,power_law_1.01,0.16316159963607788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,32,power_law_1.01,0.243833589553833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,32,power_law_1.01,0.16531840562820435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,32,power_law_1.01,0.2509376049041748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,32,balanced,0.11378133296966553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,32,power_law_1.01,0.25902719497680665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,32,power_law_1.01,0.1785024046897888
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,32,power_law_1.01,0.2546880006790161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,32,power_law_1.01,0.1796031951904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,32,power_law_1.01,0.29692161083221436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,32,balanced,1.0008266766866047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,32,power_law_1.01,0.1804927945137024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,32,power_law_1.01,0.3147264003753662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,32,power_law_1.01,0.20392959117889403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,32,balanced,0.13433067003885904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,32,power_law_1.01,0.3785919904708862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,32,power_law_1.01,0.24917759895324706
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,32,balanced,1.2542933622996013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,32,power_law_1.01,0.44071040153503416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,32,balanced,0.15458133816719055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,32,power_law_1.01,0.27895679473876955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,32,power_law_1.01,0.5399424076080322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,32,power_law_1.01,0.3642751932144165
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,32,balanced,0.18936532735824585
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,32,power_law_1.01,0.7008959770202636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,32,power_law_1.01,0.43558402061462403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,32,power_law_1.01,0.8889920234680175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,32,power_law_1.01,0.5669375896453858
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,32,balanced,1.2804693380991619
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,32,power_law_1.01,1.2049216270446776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,32,power_law_1.01,0.061299198865890504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,32,power_law_1.01,0.7826432228088379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,32,power_law_1.01,1.5112319946289063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,32,power_law_1.01,0.06649600267410279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,32,power_law_1.01,1.067103958129883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,32,power_law_1.01,1.9369600296020508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,32,balanced,0.2363040049870809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,32,power_law_1.01,0.06265599727630615
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,32,power_law_1.01,1.3801024436950684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,32,power_law_1.01,2.8066240310668946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,32,power_law_1.01,0.052134400606155394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,32,power_law_1.01,1.6468095779418945
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,32,power_law_1.01,0.05687040090560913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,32,power_law_1.01,5.479359817504883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,32,balanced,0.310810665289561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,32,power_law_1.01,0.06047359704971313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,32,power_law_1.01,2.6343807220458983
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,32,balanced,1.8414239883422852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,32,power_law_1.01,0.061408001184463504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,32,power_law_1.01,5.4858558654785154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,32,power_law_1.01,0.06654080152511596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,32,power_law_1.01,0.06751999855041504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,32,power_law_1.01,0.06776959896087646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,32,balanced,1.9563786188761394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,32,power_law_1.01,0.06776319742202759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,32,power_law_1.01,0.0735360026359558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,32,balanced,0.41803733507792157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,32,power_law_1.01,0.07444480061531067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,32,power_law_1.01,0.07835519909858704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,32,power_law_1.01,0.08758400082588196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,32,power_law_1.01,0.09022719860076904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,32,balanced,0.5962613423665365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,32,power_law_1.01,0.09734399914741516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,32,power_law_1.01,0.12380800247192383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,32,power_law_1.01,0.13836159706115722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,32,power_law_1.01,0.161900794506073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,32,power_law_1.01,0.2069375991821289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,32,power_law_1.01,0.2579967975616455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,32,balanced,0.8001013596852621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,32,power_law_1.01,0.32785279750823976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,32,power_law_1.01,0.48514561653137206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,32,balanced,3.406709353129069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,32,power_law_1.2,0.2138432025909424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,32,power_law_1.2,0.2917952060699463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,32,power_law_1.01,0.587007999420166
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,32,power_law_1.2,0.21790080070495604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,32,power_law_1.01,0.9290495872497558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,32,balanced,3.747653325398763
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,32,power_law_1.2,0.11292799711227416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,32,balanced,0.9843413035074869
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,32,power_law_1.2,0.14589439630508422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,32,power_law_1.01,1.2751104354858398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,32,power_law_1.2,0.17216639518737792
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,32,power_law_1.01,1.5673215866088868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,32,power_law_1.2,0.18518400192260742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,32,power_law_1.2,0.23342719078063964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,32,power_law_1.01,2.4753408432006836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,32,power_law_1.2,0.22880640029907226
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,32,power_law_1.01,4.761465454101563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,32,power_law_1.2,0.23544321060180665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,32,power_law_1.2,0.23601279258728028
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,32,power_law_1.2,0.23728640079498292
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,32,power_law_1.2,0.26175999641418457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,32,power_law_1.2,0.24949119091033936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,32,balanced,1.532815933227539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,32,power_law_1.2,0.25760641098022463
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,32,power_law_1.2,0.24450559616088868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,32,power_law_1.2,0.2696703910827637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,32,power_law_1.2,0.27961599826812744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,32,power_law_1.2,0.13472000360488892
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,32,power_law_1.2,0.309497594833374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,32,power_law_1.2,0.34872961044311523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,32,power_law_1.2,0.1835263967514038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,32,power_law_1.2,0.12369279861450196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,32,power_law_1.2,0.41366400718688967
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,32,power_law_1.2,0.08298879861831665
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,32,power_law_1.2,0.504633617401123
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,32,power_law_1.2,0.1183743953704834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,32,power_law_1.2,0.5872704029083252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,32,power_law_1.2,0.11448960304260254
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,32,power_law_1.2,0.8270463943481445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,32,power_law_1.2,0.1368384003639221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,32,power_law_1.2,1.0412799835205078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,32,power_law_1.2,0.15374720096588135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,32,power_law_1.2,0.15737600326538087
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,32,power_law_1.2,1.556991958618164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,32,power_law_1.2,0.14555519819259644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,32,power_law_1.2,1.7999231338500976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,32,power_law_1.2,0.15521279573440552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,32,power_law_1.2,2.360371208190918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,32,power_law_1.2,0.13865599632263184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,32,power_law_1.2,3.748505783081055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,32,power_law_1.2,0.16539520025253296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,32,power_law_1.2,0.1758784055709839
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,32,power_law_1.2,8.126252746582031
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,32,power_law_1.2,0.17224960327148436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,32,power_law_1.2,0.17681920528411865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,32,power_law_1.2,0.18888959884643555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,32,balanced,2.989760080973307
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,32,power_law_1.2,0.19971200227737426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,32,power_law_1.2,0.2121216058731079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,32,power_law_1.2,0.25605120658874514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,32,power_law_1.2,0.3354111909866333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,32,power_law_1.2,0.39244799613952636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,32,power_law_1.2,0.5059648036956788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,32,power_law_1.2,0.6684351921081543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,16,balanced,0.053898667295773826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,32,power_law_1.2,0.8028160095214844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,16,balanced,0.05469333132108053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,32,power_law_1.2,1.2814592361450194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,16,balanced,0.055173332492510475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,32,power_law_1.2,1.5477248191833497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,32,power_law_1.2,0.06165760159492493
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,16,balanced,0.05879466732343038
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,32,power_law_1.2,1.9605567932128907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,16,balanced,0.06621333460013072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,32,power_law_1.2,0.06727039813995361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,16,balanced,0.07598933577537537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,32,power_law_1.2,3.0617279052734374
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,32,power_law_1.2,0.06235520243644714
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,16,balanced,0.08542933066685994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,32,power_law_1.2,0.053465598821640016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,16,balanced,0.08661333719889323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,32,power_law_1.2,6.545990753173828
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,16,balanced,0.08618666728337605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,32,power_law_1.2,0.057017600536346434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,16,balanced,0.08691733082135518
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,32,power_law_1.2,0.05902079939842224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,16,balanced,0.0881173312664032
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,32,power_law_1.2,0.061408001184463504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,16,balanced,0.0904319981733958
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,32,power_law_1.2,0.0639743983745575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,16,balanced,0.09016533692677815
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,32,power_law_1.2,0.06548479795455933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,16,balanced,0.09313066800435384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,32,power_law_1.2,0.06813439726829529
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,16,balanced,0.09689066807428996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,16,balanced,0.0971999963124593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,32,power_law_1.2,0.0695360004901886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,16,balanced,0.10169066985448201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,32,power_law_1.2,0.07462400197982788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,16,balanced,0.10979732871055603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,32,power_law_1.2,0.07749119997024537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,16,balanced,0.12087466319402058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,16,balanced,0.047397335370381675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,32,power_law_1.2,0.0815936028957367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,16,balanced,0.04798933366934458
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,32,power_law_1.2,0.08710399866104127
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,16,balanced,0.14056000113487244
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,16,balanced,0.04844800134499868
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,32,power_law_1.2,0.08983680009841918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,16,balanced,0.0531626691420873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,16,balanced,0.16218133767445883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,32,power_law_1.2,0.10191999673843384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,16,balanced,0.05950933198134104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,16,balanced,0.06526400148868561
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,32,power_law_1.2,0.12449920177459717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,16,balanced,0.1978773276011149
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,16,balanced,0.07378133138020833
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,32,power_law_1.2,0.14908159971237184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,16,balanced,0.22827200094858804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,16,balanced,0.07520000139872234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,16,balanced,0.07528000076611836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,16,balanced,0.07603199779987335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,32,power_law_1.2,0.17779200077056884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,16,balanced,0.29409066836039227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,16,balanced,0.07830399771531422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,32,power_law_1.2,0.2098304033279419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,16,balanced,0.07935466865698497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,32,power_law_1.2,0.3130111932754517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,16,balanced,0.08158933122952779
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,16,balanced,0.046810666720072426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,16,balanced,0.08247999846935272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,16,balanced,0.37172265847524005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,16,balanced,0.0470773329337438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,16,power_law_1.01,0.0652351975440979
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,32,power_law_1.2,0.401580810546875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,16,balanced,0.08889599641164143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,16,balanced,0.0487306664387385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,32,power_law_1.2,0.5866176128387451
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,16,power_law_1.01,0.07712640166282654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,16,balanced,0.05366399884223938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,16,balanced,0.09132267038027446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,16,power_law_1.01,0.08426240086555481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,16,balanced,0.05680533250172933
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,16,balanced,0.0969599982102712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,16,power_law_1.01,0.06323199868202209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,32,power_law_1.2,0.729702377319336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,16,balanced,0.06649599969387054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,16,balanced,0.10884267091751099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,16,balanced,0.5150719881057739
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,16,power_law_1.01,0.06457599997520447
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,16,balanced,0.07739200194676717
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,32,power_law_1.2,0.9839167594909668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,16,balanced,0.12251733740170796
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,16,balanced,0.07921066880226135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,16,power_law_1.01,0.07036799788475037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,16,balanced,0.0800906668106715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,16,power_law_1.01,0.07310079932212829
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,32,power_law_1.2,1.7306751251220702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,16,balanced,0.1472106675306956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,16,balanced,0.07977066437403361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,16,power_law_1.01,0.07780479788780212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,32,power_law_1.2,1.7287168502807617
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,16,balanced,0.08193066716194153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,16,balanced,0.17296000321706137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,16,power_law_1.01,0.07780479788780212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,16,balanced,0.08573333422342937
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,32,power_law_1.2,2.9494848251342773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,16,power_law_1.01,0.07849599719047547
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,16,balanced,0.08602666854858398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,16,balanced,0.21812800566355386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,16,balanced,0.6690879662831625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,16,power_law_1.01,0.08045439720153809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,32,power_law_1.2,5.710009765625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,16,balanced,0.08794132868448894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,16,balanced,0.0943946639696757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,16,power_law_1.01,0.08208640217781067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,16,balanced,0.2656533320744832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,16,balanced,0.09678399562835693
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,16,power_law_1.01,0.08611199855804444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,16,balanced,0.10315733154614766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,16,power_law_1.01,0.08757759928703308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,16,power_law_1.01,0.09401599764823913
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,16,balanced,0.11647466818491618
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,16,balanced,0.3588266770044963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,16,power_law_1.01,0.10176639556884766
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,16,power_law_1.01,0.10902400016784668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,16,balanced,0.8128320376078287
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,16,balanced,0.13458133737246195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,16,power_law_1.01,0.13148159980773927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,16,balanced,0.463370680809021
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,16,power_law_1.01,0.13623039722442626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,16,power_law_1.01,0.16454399824142457
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,16,power_law_1.01,0.17882879972457885
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,16,balanced,0.16173866391181946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,16,power_law_1.01,0.23665280342102052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,16,balanced,0.18743999799092612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,16,power_law_1.01,0.2795711994171143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,16,balanced,0.657690684000651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,16,power_law_1.01,0.062636798620224
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,16,power_law_1.01,0.3677311897277832
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,16,balanced,0.2350613276163737
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,16,power_law_1.01,0.06362879872322083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,16,power_law_1.01,0.48470401763916016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,16,power_law_1.01,0.06903679966926575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,16,power_law_1.01,0.059628802537918094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,16,power_law_1.01,0.6377600193023681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,16,power_law_1.01,0.054527997970581055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,16,power_law_1.01,0.060601598024368285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,16,power_law_1.01,0.06754559874534607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,16,power_law_1.01,0.8135680198669434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,16,balanced,1.2535520394643147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,16,power_law_1.01,0.06275839805603027
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,16,power_law_1.01,0.07584000229835511
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,16,power_law_1.01,0.06547200083732604
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,16,power_law_1.01,1.0761343955993652
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,16,balanced,0.8521813551584879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,16,power_law_1.01,0.0677183985710144
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,16,power_law_1.01,0.05759360194206238
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,16,balanced,0.30850134293238324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,16,power_law_1.01,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,16,power_law_1.01,1.5539520263671875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,16,power_law_1.01,0.06046079993247986
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,16,power_law_1.01,0.06904320120811462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,16,power_law_1.01,0.06581760048866273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,16,power_law_1.01,0.07269759774208069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,16,power_law_1.01,3.3315200805664062
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,16,power_law_1.01,0.06909440159797668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,16,power_law_1.01,0.0749504029750824
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,16,balanced,0.4214613437652588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,16,power_law_1.01,0.07843199968338013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,16,power_law_1.01,0.07383040189743043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,16,power_law_1.01,0.08177279829978942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,16,power_law_1.01,0.07418879866600037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,16,power_law_1.01,0.09054080247879029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,16,power_law_1.01,0.07615360021591186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,16,power_law_1.01,0.09639679789543151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,16,balanced,0.5806933244069418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,16,power_law_1.01,0.07763199806213379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,16,power_law_1.01,0.1020095944404602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,16,balanced,1.0460533301035564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,16,power_law_1.01,0.12164479494094849
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,16,power_law_1.01,0.08165119886398316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,16,power_law_1.01,0.1323583960533142
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,16,power_law_1.01,0.08350080251693726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,16,power_law_1.01,0.16459519863128663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,16,power_law_1.01,0.18447359800338745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,16,power_law_1.01,0.09114239811897278
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,16,power_law_1.01,0.25347840785980225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,16,power_law_1.01,0.09937279820442199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,16,power_law_1.01,0.28769280910491946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,16,balanced,0.8015999794006348
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,16,power_law_1.01,0.10580480098724365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,16,power_law_1.2,0.06805760264396668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,16,power_law_1.01,0.42225918769836424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,16,power_law_1.01,0.5337408065795899
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,16,power_law_1.01,0.11465599536895751
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,16,power_law_1.2,0.07740799784660339
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,16,power_law_1.01,0.7848063945770264
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,16,power_law_1.01,0.14257279634475709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,16,power_law_1.2,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,16,power_law_1.01,0.967750358581543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,16,power_law_1.2,0.06181120276451111
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,16,power_law_1.01,1.209113597869873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,16,power_law_1.01,0.16051199436187744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,16,power_law_1.2,0.06536319851875305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,16,power_law_1.01,1.9795455932617188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,16,power_law_1.2,0.06972799897193908
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,16,power_law_1.01,3.7323646545410156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,16,power_law_1.2,0.07334399819374085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,16,power_law_1.01,0.20239999294281005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,16,balanced,1.6424585978190105
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,16,power_law_1.2,0.07812479734420777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,16,power_law_1.01,0.22277119159698486
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,16,balanced,2.3650399843851724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,16,balanced,1.0683893362681072
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,16,power_law_1.2,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,16,power_law_1.01,0.3602303981781006
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,16,power_law_1.2,0.07850239872932434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,16,power_law_1.2,0.08054400086402894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,16,power_law_1.01,0.4333439826965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,16,power_law_1.2,0.08201599717140198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,16,power_law_1.01,0.6109951972961426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,16,power_law_1.2,0.08389760255813598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,16,power_law_1.01,0.7742527961730957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,16,power_law_1.2,0.09004799723625183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,16,power_law_1.01,1.1924415588378907
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,16,balanced,1.3163200219472249
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,16,power_law_1.2,0.09847040176391601
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,16,power_law_1.2,0.10299520492553711
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,16,power_law_1.01,1.4647744178771973
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,16,power_law_1.2,0.11366399526596069
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,16,power_law_1.2,0.13056000471115112
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,16,power_law_1.01,1.890060806274414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,16,power_law_1.2,0.13389439582824708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,16,power_law_1.01,2.823801612854004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,16,power_law_1.2,0.16747519969940186
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,16,power_law_1.2,0.208787202835083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,16,power_law_1.01,6.265958404541015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,16,power_law_1.2,0.2779520034790039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,16,power_law_1.2,0.31354238986968996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,16,power_law_1.2,0.40265598297119143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,16,power_law_1.2,0.5582911968231201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,16,balanced,2.0606719652811685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,16,power_law_1.2,0.7754240036010742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,16,balanced,3.1795787811279297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,16,power_law_1.2,0.9494336128234864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,16,power_law_1.2,1.1090687751770019
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,16,power_law_1.2,0.05792639851570129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,16,power_law_1.2,1.8593984603881837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,16,power_law_1.2,0.06501759886741638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,16,power_law_1.2,0.05787519812583923
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,16,power_law_1.2,3.618316650390625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,16,power_law_1.2,0.05354239940643311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,16,power_law_1.2,0.06209920048713684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,16,power_law_1.2,0.060710400342941284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,16,power_law_1.2,0.06209920048713684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,16,power_law_1.2,0.06702719926834107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,16,power_law_1.2,0.06795520186424256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,16,power_law_1.2,0.06903679966926575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,16,power_law_1.2,0.07182719707489013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,16,power_law_1.2,0.07487360239028931
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,16,power_law_1.2,0.07769600152969361
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,16,power_law_1.2,0.08056319952011108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,16,power_law_1.2,0.09134719967842102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,16,power_law_1.2,0.09459199905395507
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,16,balanced,4.030917485555013
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,16,power_law_1.2,0.10274560451507568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,16,power_law_1.2,0.12421120405197143
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,16,power_law_1.2,0.1381824016571045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,16,power_law_1.2,0.17501440048217773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,16,power_law_1.2,0.20136959552764894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,16,power_law_1.2,0.278112006187439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,16,power_law_1.2,0.3211967945098877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,16,power_law_1.2,0.4457536220550537
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,16,power_law_1.2,0.5700032234191894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,16,power_law_1.2,0.8503616333007813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,16,power_law_1.2,0.05968639850616455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,16,power_law_1.2,1.0843135833740234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,16,power_law_1.2,0.06789119839668274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,16,power_law_1.2,0.05737599730491638
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,16,power_law_1.2,1.3256447792053223
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,16,power_law_1.2,0.05475839972496033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,16,power_law_1.2,2.227078437805176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,16,power_law_1.2,0.058719998598098753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,16,power_law_1.2,0.0636672019958496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,16,power_law_1.2,4.536243057250976
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,16,power_law_1.2,0.06855040192604064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,8,balanced,0.055760001142819725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,16,power_law_1.2,0.07278079986572265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,8,balanced,0.055120001236597695
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,16,power_law_1.2,0.07474560141563416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,8,balanced,0.05691733459631602
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,8,balanced,0.0614026685555776
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,16,power_law_1.2,0.07538560032844543
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,8,balanced,0.07011199990908305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,8,balanced,0.09427733222643535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,16,power_law_1.2,0.07770879864692688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,8,balanced,0.10764799515406291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,16,power_law_1.2,0.08284159898757934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,8,balanced,0.10282133022944133
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,8,balanced,0.10373333096504211
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,16,power_law_1.2,0.08542079925537109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,8,balanced,0.1051626702149709
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,8,balanced,0.0480373352766037
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,8,balanced,0.10575999816258748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,16,power_law_1.2,0.09240959882736206
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,8,balanced,0.04858666658401489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,8,balanced,0.10691733161608379
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,16,power_law_1.2,0.0992959976196289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,8,balanced,0.050053333242734276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,8,balanced,0.05593066910902659
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,8,balanced,0.10912533601125081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,16,power_law_1.2,0.10528000593185424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,8,balanced,0.06087466577688853
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,8,balanced,0.10732799768447876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,16,power_law_1.2,0.11521919965744018
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,8,balanced,0.08107733229796092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,16,power_law_1.2,0.14058879613876343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,8,balanced,0.09092799822489421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,8,balanced,0.11973866820335388
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,8,balanced,0.09329066673914592
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,8,balanced,0.11815466483434041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,8,balanced,0.09289600451787312
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,16,power_law_1.2,0.1735103964805603
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,8,balanced,0.09342933694521587
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,8,balanced,0.12102933724721272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,8,balanced,0.09488000472386678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,8,balanced,0.13750933607419333
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,8,balanced,0.09656000137329102
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,16,power_law_1.2,0.1960960030555725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,8,balanced,0.09808533390363057
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,8,balanced,0.14801599582036337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,16,power_law_1.2,0.26071040630340575
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,8,balanced,0.09967999656995137
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,8,balanced,0.10735999544461568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,16,power_law_1.2,0.36487040519714353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,8,balanced,0.17081065972646078
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,8,balanced,0.10988266269365947
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,8,balanced,0.1156160036722819
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,8,balanced,0.1949440042177836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,8,balanced,0.13040533661842346
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,16,power_law_1.2,0.44214401245117185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,8,balanced,0.14433599511782327
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,16,power_law_1.2,0.6835072040557861
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,8,balanced,0.2321760058403015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,8,balanced,0.17291200160980225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,16,power_law_1.2,0.9004223823547364
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,16,power_law_1.2,1.2142016410827636
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,8,balanced,0.2070080041885376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,8,balanced,0.2818506757418315
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,8,balanced,0.2579893271128337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,16,power_law_1.2,1.5987775802612305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,8,power_law_1.01,0.06154879927635193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,8,balanced,0.37477866808573407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,16,power_law_1.2,2.1954431533813477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,8,balanced,0.3180053234100342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,8,power_law_1.01,0.06234880089759827
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,16,power_law_1.2,3.609535980224609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,8,power_law_1.01,0.08403840065002441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,8,power_law_1.01,0.06335999965667724
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,16,power_law_1.2,7.314080047607422
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,8,balanced,0.47789867719014484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,8,power_law_1.01,0.06800640225410462
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,8,balanced,0.4373279809951782
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,8,power_law_1.01,0.082777601480484
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,8,power_law_1.01,0.08814719915390015
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,8,power_law_1.01,0.09204480051994324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,8,balanced,0.5660053491592407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,8,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,8,power_law_1.01,0.09267200231552124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,8,balanced,0.6739359696706136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,8,power_law_1.01,0.09604480266571044
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,8,power_law_1.01,0.05672320127487183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,8,power_law_1.01,0.09811840057373047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,8,power_law_1.01,0.07171840071678162
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,8,power_law_1.01,0.10170880556106568
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,8,power_law_1.01,0.054425597190856934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,8,power_law_1.01,0.10955519676208496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,8,balanced,0.8106133143107096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,8,power_law_1.01,0.06280320286750793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,8,power_law_1.01,0.10652799606323242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,8,power_law_1.01,0.07004799842834472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,8,power_law_1.01,0.11507840156555176
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,8,power_law_1.01,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,8,balanced,0.8616800308227539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,8,power_law_1.01,0.12259839773178101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,8,power_law_1.01,0.08035839796066284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,8,power_law_1.01,0.12881920337677003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,8,power_law_1.01,0.1522112011909485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,8,power_law_1.01,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,8,power_law_1.01,0.18246400356292725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,8,power_law_1.01,0.08433279991149903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,8,power_law_1.01,0.23276159763336182
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,8,balanced,1.0420640309651692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,8,power_law_1.01,0.0865664005279541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,8,power_law_1.01,0.23417599201202394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,8,power_law_1.01,0.08856959939002991
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,8,power_law_1.01,0.29792640209197996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,8,power_law_1.01,0.09047679901123047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,8,power_law_1.01,0.3593983888626099
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,8,power_law_1.01,0.10032000541687011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,8,power_law_1.01,0.4782847881317139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,8,balanced,1.0637333393096924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,8,power_law_1.01,0.10826879739761353
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,8,power_law_1.01,0.577504014968872
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,8,power_law_1.01,0.11952639818191528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,8,power_law_1.01,0.7912447929382325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,8,power_law_1.01,0.1223423957824707
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,8,power_law_1.01,1.049062442779541
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,8,balanced,1.2899680137634277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,8,power_law_1.01,0.14803199768066405
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,8,power_law_1.01,1.312953567504883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,8,power_law_1.01,0.1542464017868042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,8,power_law_1.01,2.066054344177246
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,8,power_law_1.01,0.20074241161346434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,8,power_law_1.01,0.21932799816131593
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,8,power_law_1.01,3.8492286682128904
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,8,power_law_1.01,0.2941567897796631
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,8,power_law_1.01,0.35538558959960936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,8,power_law_1.01,0.5263552188873291
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,8,power_law_1.01,0.6484928131103516
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,8,balanced,1.6713493665059407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,8,power_law_1.01,0.8976192474365234
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,8,power_law_1.01,1.2313471794128419
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,8,power_law_1.01,1.5652607917785644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,8,balanced,2.023914655049642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,8,power_law_1.01,2.301254463195801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,8,power_law_1.2,0.06158080101013184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,8,power_law_1.2,0.06264320015907288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,8,power_law_1.01,4.551891326904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,8,power_law_1.2,0.06789759993553161
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,8,power_law_1.2,0.06324480175971985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,8,power_law_1.2,0.06561279892921448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,8,power_law_1.2,0.0802944004535675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,8,power_law_1.2,0.08522239923477173
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,8,power_law_1.2,0.09156479835510253
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,8,power_law_1.2,0.09165440201759338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,8,power_law_1.2,0.09411839842796325
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,8,power_law_1.2,0.1004032015800476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,8,power_law_1.2,0.10619519948959351
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,8,power_law_1.2,0.10698879957199096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,8,power_law_1.2,0.10682879686355591
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,8,power_law_1.2,0.11604479551315308
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,8,power_law_1.2,0.12721920013427734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,8,power_law_1.2,0.13059200048446656
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,8,balanced,3.076618512471517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,8,power_law_1.2,0.153766405582428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,8,power_law_1.2,0.19302400350570678
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,8,power_law_1.2,0.23578879833221436
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,8,power_law_1.2,0.24997119903564452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,8,balanced,3.903898557027181
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,8,power_law_1.2,0.30906240940093993
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,8,power_law_1.2,0.3754048109054565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,8,power_law_1.2,0.49635839462280273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,8,power_law_1.2,0.6254528045654297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,8,power_law_1.2,0.8471360206604004
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,8,power_law_1.2,1.138758373260498
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,8,power_law_1.2,1.3790975570678712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,8,power_law_1.2,2.211507225036621
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,8,power_law_1.2,4.527212905883789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,8,power_law_1.2,0.053260797262191774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,8,power_law_1.2,0.056831997632980344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,8,power_law_1.2,0.06261119842529297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,8,power_law_1.2,0.05624319911003113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,8,power_law_1.2,0.06257920265197754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,8,power_law_1.2,0.06938239932060242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,8,power_law_1.2,0.07010560035705567
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,8,power_law_1.2,0.08055679798126221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,8,power_law_1.2,0.08279680013656616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,8,power_law_1.2,0.0825984001159668
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,8,power_law_1.2,0.08416640162467956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,8,power_law_1.2,0.08866559863090515
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,8,power_law_1.2,0.09101439714431762
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,128,balanced,0.04206933577855428
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,8,power_law_1.2,0.09989759922027588
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,8,power_law_1.2,0.1125823974609375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,128,balanced,0.044010668992996216
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,8,power_law_1.2,0.11662080287933349
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,128,balanced,0.04404800136884054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,8,power_law_1.2,0.12486399412155151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,128,balanced,0.04934933284918467
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,8,power_law_1.2,0.15114879608154297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,128,balanced,0.05363733569780985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,128,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,128,balanced,0.06465066472689311
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,8,power_law_1.2,0.16397440433502197
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,128,power_law_1.01,0.04376960098743439
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,128,balanced,0.060346667965253196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,8,power_law_1.2,0.20495359897613524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,128,power_law_1.01,0.043110400438308716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,128,balanced,0.059936001896858215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,8,power_law_1.2,0.22709119319915771
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,128,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,128,balanced,0.06781866649786632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,8,power_law_1.2,0.3061376094818115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,128,power_law_1.01,0.04965760111808777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,128,balanced,0.06775466601053874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,8,power_law_1.2,0.3750848054885864
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,128,balanced,0.06803733110427856
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,128,power_law_1.01,0.05682560205459595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,128,balanced,0.06700799862543742
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,8,power_law_1.2,0.5176447868347168
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,128,power_law_1.01,0.05788159966468811
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,128,balanced,0.06883733471234639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,128,power_law_1.01,0.05826560258865356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,8,power_law_1.2,0.6727424144744873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,128,balanced,0.0689333329598109
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,128,power_law_1.01,0.06702719926834107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,128,power_law_1.2,0.041555199027061465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,8,power_law_1.2,1.015180778503418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,128,balanced,0.0701386680205663
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,128,power_law_1.01,0.06710399985313416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,8,power_law_1.2,1.290982437133789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,128,power_law_1.2,0.0430400013923645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,128,balanced,0.06969599922498067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,128,power_law_1.01,0.06726400256156921
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,128,power_law_1.2,0.042419201135635375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,128,balanced,0.07151466608047485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,8,power_law_1.2,1.5230719566345214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,128,power_law_1.01,0.06714879870414733
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,128,power_law_1.2,0.046003198623657225
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,128,balanced,0.07434133191903432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,128,power_law_1.01,0.06770560145378113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,8,power_law_1.2,2.402195167541504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,128,power_law_1.2,0.04912639856338501
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,128,balanced,0.07728533446788788
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,128,power_law_1.01,0.06863359808921814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,128,power_law_1.2,0.05606399774551392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,128,balanced,0.08406399687131245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,8,power_law_1.2,5.589926528930664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,128,power_law_1.01,0.06907520294189454
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,128,power_law_1.2,0.056543999910354616
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,128,power_law_1.01,0.06977279782295227
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,128,balanced,0.093941330909729
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,128,power_law_1.2,0.056908798217773435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,128,power_law_1.01,0.07134079933166504
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,128,power_law_1.2,0.06641280055046081
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,128,balanced,0.11144000291824341
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,128,power_law_1.01,0.07555199861526489
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,128,power_law_1.2,0.0661184012889862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,128,power_law_1.01,0.07859200239181519
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,128,balanced,0.12501333157221475
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,128,power_law_1.2,0.06624000072479248
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,128,power_law_1.01,0.08790400028228759
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,128,power_law_1.2,0.06649600267410279
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,128,balanced,0.15793599685033163
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,128,power_law_1.01,0.09955840110778809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,128,power_law_1.2,0.06696320176124573
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,64,balanced,0.032245332996050514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,128,power_law_1.01,0.14910080432891845
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,128,power_law_1.2,0.06771199703216553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,64,balanced,0.03312533348798752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,128,balanced,0.19557867447535196
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,128,power_law_1.01,0.17231359481811523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,128,power_law_1.2,0.06877440214157104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,64,balanced,0.03329599897066752
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,128,power_law_1.01,0.24274559020996095
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,64,balanced,0.03748800108830134
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,128,power_law_1.2,0.06939520239830017
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,64,balanced,0.03932799895604452
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,128,power_law_1.01,0.3235584020614624
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,128,power_law_1.2,0.0711296021938324
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,128,balanced,0.2799520095189412
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,64,balanced,0.04533333579699198
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,128,power_law_1.01,0.4573184013366699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,128,power_law_1.2,0.07708160281181335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,64,power_law_1.01,0.03224959969520569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,64,balanced,0.05293866495291392
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,128,power_law_1.2,0.0780672013759613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,128,power_law_1.01,0.6391104221343994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,64,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,64,power_law_1.01,0.03326080143451691
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,128,power_law_1.2,0.09836159944534302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,128,power_law_1.01,0.7773248195648194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,64,balanced,0.05294933418432871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,64,power_law_1.01,0.033939200639724734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,128,balanced,0.36370666821797687
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,128,power_law_1.2,0.13175679445266725
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,128,power_law_1.01,1.319827175140381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,64,balanced,0.053583999474843345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,64,power_law_1.01,0.036524799466133115
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,128,power_law_1.2,0.18315520286560058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,64,balanced,0.053082664807637535
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,64,power_law_1.01,0.039577600359916684
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,128,power_law_1.01,2.634636878967285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,128,power_law_1.2,0.21484799385070802
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,64,power_law_1.2,0.03235200047492981
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,64,balanced,0.053583999474843345
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,64,power_law_1.01,0.04349440038204193
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,128,power_law_1.2,0.34286720752716066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,64,balanced,0.06052800019582113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,64,power_law_1.2,0.033318400382995605
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,128,balanced,0.4501173496246338
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,64,power_law_1.01,0.05006080269813538
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,64,power_law_1.2,0.032576000690460204
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,64,balanced,0.06003733476003011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,128,power_law_1.2,0.4373311996459961
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,64,power_law_1.2,0.036499199271202085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,64,power_law_1.01,0.049932798743247984
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,64,balanced,0.060559997955958046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,64,power_law_1.2,0.03902080059051514
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,128,power_law_1.2,0.7309184074401855
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,64,power_law_1.01,0.05117440223693848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,64,power_law_1.2,0.042982399463653564
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,64,balanced,0.06052800019582113
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,128,power_law_1.2,0.8127039909362793
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,64,power_law_1.2,0.049747198820114136
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,64,power_law_1.01,0.04929920136928558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,64,balanced,0.06200533111890157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,64,power_law_1.2,0.049702399969100954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,128,power_law_1.2,1.0816320419311523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,64,power_law_1.01,0.051635199785232545
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,64,power_law_1.2,0.05000960230827332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,64,balanced,0.06463466584682465
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,128,power_law_1.2,1.8513216018676757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,64,power_law_1.2,0.049670401215553286
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,64,power_law_1.01,0.05187839865684509
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,128,balanced,0.7048213481903076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,64,balanced,0.0685280015071233
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,64,power_law_1.2,0.0520576000213623
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,64,power_law_1.01,0.058764797449111936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,128,power_law_1.2,4.0161792755126955
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,64,power_law_1.2,0.05321599841117859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,64,balanced,0.07487999896208446
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,64,power_law_1.01,0.05857920050621033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,64,power_law_1.2,0.05926399827003479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,64,power_law_1.2,0.05882880091667175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,64,balanced,0.08542933066685994
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,64,power_law_1.01,0.059443199634552
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,64,power_law_1.2,0.05915520191192627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,64,power_law_1.01,0.05969280004501343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,64,power_law_1.2,0.06085759997367859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,64,balanced,0.102101335922877
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,64,power_law_1.2,0.0630016028881073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,64,power_law_1.01,0.06208639740943909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,64,power_law_1.2,0.06704000234603882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,64,power_law_1.01,0.06695680022239685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,64,balanced,0.11806399623552959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,64,power_law_1.2,0.07154560089111328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,64,power_law_1.2,0.08561919927597046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,64,power_law_1.01,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,64,power_law_1.2,0.10216319561004639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,64,balanced,0.15813866257667542
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,64,power_law_1.01,0.07831040024757385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,64,power_law_1.2,0.14484479427337646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,64,power_law_1.2,0.1713088035583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,64,power_law_1.01,0.09995520114898682
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,64,power_law_1.2,0.25511679649353025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,64,balanced,0.19055465857187906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,64,power_law_1.01,0.11756160259246826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,64,power_law_1.2,0.3457279920578003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,32,balanced,0.029088000456492107
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,128,balanced,1.3804319699605305
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,64,power_law_1.2,0.4344768047332764
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,64,power_law_1.01,0.15871360301971435
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,32,balanced,0.030282666285832722
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,64,power_law_1.2,0.770739221572876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,64,power_law_1.01,0.21575679779052734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,32,balanced,0.030554667115211487
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,64,power_law_1.2,0.8473664283752441
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,64,balanced,0.26892266670862836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,32,balanced,0.03324266771475474
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,64,power_law_1.01,0.2674367904663086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,64,power_law_1.2,1.358694362640381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,32,balanced,0.03533333291610082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,64,power_law_1.01,0.3976639986038208
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,64,power_law_1.2,2.898598480224609
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,32,balanced,0.038618666430314384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,64,power_law_1.01,0.5150976181030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,32,balanced,0.04307733476161957
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,64,balanced,0.3479626576105754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,32,balanced,0.04293866455554962
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,64,power_law_1.01,0.6343423843383789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,32,balanced,0.047168001532554626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,64,power_law_1.01,1.0360063552856444
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,32,balanced,0.04604266583919525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,64,power_law_1.01,2.097305679321289
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,32,balanced,0.04757333298524221
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,32,balanced,0.047354668378829956
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,64,balanced,0.43030401070912677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,32,balanced,0.047781333327293396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,32,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,32,balanced,0.05009066561857859
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,32,balanced,0.05715199808279673
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,32,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,32,balanced,0.06073066592216492
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,64,balanced,0.6717973550160726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,32,balanced,0.06420266628265381
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,32,balanced,0.07179733117421468
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,32,balanced,0.08329600095748901
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,32,power_law_1.01,0.0302592009305954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,32,balanced,0.10309333602587382
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,32,power_law_1.01,0.030643200874328612
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,32,power_law_1.01,0.02988159954547882
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,32,balanced,0.11917866269747417
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,32,power_law_1.01,0.03368319869041443
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,32,power_law_1.01,0.03511039912700653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,32,balanced,0.1607253352801005
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,32,power_law_1.01,0.03769600093364715
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,32,balanced,0.19369600216547647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,32,power_law_1.01,0.041388800740242
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,64,balanced,1.319701353708903
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,32,power_law_1.01,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,32,power_law_1.01,0.04614399969577789
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,32,balanced,0.2646080056826274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,32,power_law_1.01,0.04547840058803558
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,32,power_law_1.01,0.0471807986497879
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,32,power_law_1.01,0.04708479940891266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,32,power_law_1.01,0.04748800098896026
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,32,balanced,0.34136001269022626
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,32,power_law_1.01,0.04954879879951477
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,32,power_law_1.01,0.049856001138687135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,32,power_law_1.01,0.05717759728431702
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,32,power_law_1.01,0.05751039981842041
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,32,power_law_1.01,0.06398079991340637
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,32,balanced,0.42054935296376544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,32,power_law_1.01,0.07017599940299987
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,32,power_law_1.2,0.0302592009305954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,32,power_law_1.01,0.08112639784812928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,32,power_law_1.01,0.09247360229492188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,32,power_law_1.2,0.03088639974594116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,32,power_law_1.01,0.11564799547195434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,32,power_law_1.2,0.030099201202392577
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,32,power_law_1.2,0.03377920091152191
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,32,power_law_1.01,0.1352959990501404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,32,power_law_1.2,0.03490560054779053
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,32,power_law_1.01,0.1968384027481079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,32,balanced,0.6580426692962646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,32,power_law_1.2,0.037574398517608645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,32,power_law_1.01,0.2423935890197754
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,16,balanced,0.027402666707833607
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,32,power_law_1.2,0.04137600064277649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,32,power_law_1.01,0.3666687965393066
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,16,balanced,0.029157333076000214
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,32,power_law_1.2,0.042080000042915344
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,32,power_law_1.01,0.4539648056030273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,16,balanced,0.029152000943819683
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,32,power_law_1.2,0.045440000295639035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,32,power_law_1.01,0.5719871997833252
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,16,balanced,0.03270400067170461
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,32,power_law_1.2,0.046675199270248414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,32,power_law_1.01,0.9244480133056641
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,16,balanced,0.03382933388153712
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,32,power_law_1.2,0.04604800045490265
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,16,balanced,0.03480000048875809
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,32,power_law_1.01,1.7550527572631835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,32,power_law_1.2,0.04847359955310822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,16,balanced,0.03745600084463755
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,32,power_law_1.2,0.0473471999168396
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,16,balanced,0.03581333408753077
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,32,power_law_1.2,0.05066879987716675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,16,balanced,0.04032533367474874
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,32,power_law_1.2,0.051123201847076416
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,16,balanced,0.04112533231576284
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,32,balanced,1.2904106775919597
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,32,power_law_1.2,0.057715201377868654
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,16,balanced,0.0390133336186409
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,32,power_law_1.2,0.06071680188179016
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,16,balanced,0.05324266850948334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,16,power_law_1.01,0.028012800216674804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,32,power_law_1.2,0.0690559983253479
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,16,balanced,0.054431999723116554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,16,power_law_1.01,0.0315775990486145
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,16,balanced,0.049312000473340355
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,32,power_law_1.2,0.07131519913673401
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,16,power_law_1.2,0.027935999631881713
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,16,power_law_1.01,0.030796799063682555
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,16,power_law_1.01,0.03223040103912354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,16,balanced,0.05072533090909322
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,32,power_law_1.2,0.08195199966430664
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,16,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,16,power_law_1.01,0.032543998956680295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,16,balanced,0.05427733560403188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,32,power_law_1.2,0.09616000056266785
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,16,power_law_1.2,0.02879360020160675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,16,power_law_1.01,0.03288320004940033
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,16,balanced,0.056133334835370384
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,32,power_law_1.2,0.12919679880142212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,16,power_law_1.01,0.03620480000972748
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,16,power_law_1.2,0.03248000144958496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,16,power_law_1.01,0.03472639918327332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,32,power_law_1.2,0.1474560022354126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,16,balanced,0.06443733473618825
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,16,power_law_1.2,0.03271040022373199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,8,balanced,0.026181332767009735
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,16,power_law_1.01,0.040403199195861814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,16,power_law_1.01,0.03988479971885681
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,16,power_law_1.2,0.033024001121521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,16,balanced,0.06902933120727539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,32,power_law_1.2,0.20661120414733886
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,8,balanced,0.027797333896160126
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,16,power_law_1.01,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,16,power_law_1.2,0.03635840117931366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,32,power_law_1.2,0.26966400146484376
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,8,balanced,0.02775999903678894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,16,power_law_1.01,0.05070080161094666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,16,balanced,0.07668800155321757
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,16,power_law_1.01,0.05223039984703064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,16,power_law_1.2,0.03464959859848023
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,8,balanced,0.03159466634194056
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,32,power_law_1.2,0.4424767971038818
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,16,balanced,0.08858666817347209
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,16,power_law_1.01,0.05016319751739502
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,8,balanced,0.03294933338960012
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,16,power_law_1.2,0.040268799662590025
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,16,power_law_1.01,0.05124480128288269
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,32,power_law_1.2,0.537766408920288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,16,balanced,0.10750400026639302
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,16,power_law_1.01,0.056364798545837404
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,8,balanced,0.035071998834609985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,16,power_law_1.2,0.04010879993438721
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,32,power_law_1.2,0.7495039939880371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,16,power_law_1.01,0.059673601388931276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,8,balanced,0.03522666543722153
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,16,power_law_1.01,0.06911360025405884
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,16,power_law_1.2,0.0383103996515274
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,16,balanced,0.12369599938392639
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,32,power_law_1.2,1.1312576293945313
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,8,balanced,0.034527999659379326
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,16,power_law_1.01,0.07500159740447998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,16,power_law_1.2,0.05306239724159241
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,16,power_law_1.01,0.08447359800338745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,8,balanced,0.03710933278004328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,32,power_law_1.2,2.477516746520996
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,16,power_law_1.01,0.09698560237884521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,16,power_law_1.2,0.05259519815444946
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,16,balanced,0.1673226753870646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,8,balanced,0.03749866783618927
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,16,power_law_1.01,0.11712640523910522
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,8,balanced,0.03623999903599421
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,16,power_law_1.01,0.13969919681549073
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,16,power_law_1.2,0.05185920000076294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,16,power_law_1.01,0.1867583990097046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,8,balanced,0.042463997999827065
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,16,balanced,0.20058667659759521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,16,power_law_1.2,0.05151360034942627
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,16,power_law_1.01,0.2595455884933472
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,8,balanced,0.043968002001444496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,16,power_law_1.2,0.055289602279663085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,16,power_law_1.01,0.3521087884902954
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,8,balanced,0.041759997606277466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,16,power_law_1.2,0.06039040088653565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,16,power_law_1.01,0.43520641326904297
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,16,balanced,0.2752000093460083
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,16,power_law_1.01,0.570304012298584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,8,balanced,0.056101332108179726
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,16,power_law_1.2,0.069760000705719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,16,power_law_1.01,0.8607359886169433
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,8,balanced,0.05771199862162272
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,16,power_law_1.2,0.07473919987678528
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,16,power_law_1.01,1.7977535247802734
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,8,balanced,0.054416000843048096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,16,power_law_1.2,0.08687999844551086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,8,balanced,0.0631039987007777
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,16,power_law_1.2,0.09915519952774048
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,16,balanced,0.3575199842453003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,8,balanced,0.0699946681658427
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,16,power_law_1.2,0.1229248046875
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,8,power_law_1.01,0.026873600482940675
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,16,power_law_1.2,0.14693119525909423
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,8,balanced,0.08392533659934998
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,8,power_law_1.01,0.0285504013299942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,16,power_law_1.2,0.22271358966827393
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,8,power_law_1.01,0.02768000066280365
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,8,balanced,0.09392000238100688
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,16,balanced,0.447653333346049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,16,power_law_1.2,0.2720128059387207
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,8,power_law_1.01,0.030668801069259642
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,8,balanced,0.11204266548156738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,16,power_law_1.2,0.399072003364563
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,8,power_law_1.01,0.031916800141334536
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,8,power_law_1.01,0.03307519853115082
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,8,balanced,0.12920533617337546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,16,power_law_1.2,0.508454418182373
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,8,power_law_1.01,0.034169599413871765
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,16,power_law_1.2,0.6610943794250488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,8,balanced,0.17667200167973837
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,8,power_law_1.01,0.03372159898281098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,16,power_law_1.2,0.9797375679016114
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,8,power_law_1.01,0.03637759983539581
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,16,power_law_1.2,1.8796863555908203
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,8,power_law_1.01,0.03699840009212494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,16,balanced,0.6902026335398356
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,8,balanced,0.21133333444595337
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,8,power_law_1.01,0.03482879996299744
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,8,power_law_1.01,0.04280959963798523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,8,power_law_1.01,0.04248960018157959
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,8,balanced,0.2899786631266276
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,8,power_law_1.01,0.04115839898586273
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,8,power_law_1.01,0.05678719878196716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,8,power_law_1.01,0.05667200088500977
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,8,balanced,0.37335999806722003
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,8,power_law_1.01,0.0582144021987915
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,8,power_law_1.01,0.06835200190544129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,8,power_law_1.01,0.0739135980606079
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,8,power_law_1.01,0.09020159840583801
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,8,balanced,0.47093331813812256
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,8,power_law_1.01,0.10084480047225952
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,16,balanced,1.3499093055725098
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,8,power_law_1.01,0.12228480577468873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,8,power_law_1.01,0.14766720533370972
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,8,power_law_1.01,0.19224319458007813
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,8,power_law_1.01,0.2421247959136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,8,power_law_1.01,0.3470016002655029
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,8,balanced,0.7180480162302653
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,8,power_law_1.2,0.026726400852203368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,8,power_law_1.01,0.4344128131866455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,8,power_law_1.2,0.02844800055027008
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,8,power_law_1.01,0.5715392112731934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,8,power_law_1.2,0.027481600642204285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,8,power_law_1.01,0.8847231864929199
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,32,balanced,0.028234665592511494
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,8,power_law_1.2,0.03022719919681549
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,8,power_law_1.01,1.8045631408691407
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,32,balanced,0.02881066749493281
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,8,power_law_1.2,0.031219199299812317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,32,balanced,0.028688001135985058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,8,power_law_1.2,0.033062401413917544
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,32,balanced,0.032831999162832894
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,8,power_law_1.2,0.034067198634147644
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,32,balanced,0.03495466709136963
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,8,power_law_1.2,0.03370879888534546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,32,balanced,0.040821333726247154
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,8,power_law_1.2,0.03597440123558045
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,32,balanced,0.04098666707674662
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,8,power_law_1.2,0.03688960075378418
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,32,balanced,0.04079466561476389
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,8,balanced,1.4032853444417317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,8,power_law_1.2,0.03501439988613129
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,32,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,8,power_law_1.2,0.0411327987909317
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,32,balanced,0.041536000867684685
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,8,power_law_1.2,0.04209280014038086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,32,balanced,0.04144533226887385
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,8,power_law_1.2,0.040633600950241086
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,8,power_law_1.2,0.05543680191040039
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,8,power_law_1.2,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,32,balanced,0.041834667325019836
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,8,power_law_1.2,0.060121601819992064
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,32,power_law_1.01,0.027327999472618103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,32,balanced,0.043978666265805565
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,8,power_law_1.2,0.06837120056152343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,32,balanced,0.047082667549451195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,32,power_law_1.01,0.028729599714279175
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,8,power_law_1.2,0.07518079876899719
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,32,balanced,0.04770666857560476
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,32,power_law_1.01,0.028960001468658448
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,8,power_law_1.2,0.09196159839630128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,32,balanced,0.05435200035572052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,32,power_law_1.01,0.032025599479675294
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,32,power_law_1.2,0.027385601401329042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,32,balanced,0.056143999099731445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,8,power_law_1.2,0.10563839673995971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,32,power_law_1.01,0.03383040130138397
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,32,power_law_1.2,0.028569599986076354
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,8,power_law_1.2,0.12486399412155151
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,32,balanced,0.05810666580994924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,32,power_law_1.01,0.040089601278305055
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,32,power_law_1.2,0.028652799129486085
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,32,power_law_1.2,0.0319680005311966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,8,power_law_1.2,0.15324800014495848
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,32,power_law_1.01,0.040652799606323245
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,32,balanced,0.061477333307266235
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,32,power_law_1.2,0.03374719917774201
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,8,power_law_1.2,0.20107519626617432
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,32,power_law_1.01,0.04083200097084046
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,32,balanced,0.06699733436107635
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,32,power_law_1.2,0.03989120125770569
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,32,power_law_1.2,0.040300801396369934
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,32,power_law_1.01,0.040838399529457094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,8,power_law_1.2,0.2838527917861938
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,32,balanced,0.07545066873232524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,32,power_law_1.2,0.04081279933452606
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,32,power_law_1.01,0.041126400232315063
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,8,power_law_1.2,0.39045119285583496
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,32,power_law_1.2,0.040863999724388124
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,32,balanced,0.09774933258692424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,32,power_law_1.2,0.040915200114250184
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,32,power_law_1.01,0.04113920032978058
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,8,power_law_1.2,0.5333439826965332
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,32,power_law_1.2,0.041152000427246094
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,32,power_law_1.01,0.04196479916572571
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,32,power_law_1.2,0.04224640130996704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,8,power_law_1.2,0.6351488113403321
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,32,balanced,0.11502933502197266
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,32,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,32,power_law_1.01,0.044275200366973876
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,8,power_law_1.2,0.9325823783874512
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,32,power_law_1.2,0.04712960124015808
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,32,power_law_1.01,0.047391998767852786
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,32,power_law_1.2,0.04807040095329285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,32,balanced,0.15275733669598898
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,8,power_law_1.2,1.9418304443359375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,32,power_law_1.01,0.048153600096702574
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,32,power_law_1.2,0.0548799991607666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,32,power_law_1.2,0.056358402967453
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,32,power_law_1.01,0.05491200089454651
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,32,power_law_1.2,0.06498559713363647
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,32,balanced,0.18712000052134195
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,32,power_law_1.01,0.05642240047454834
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,32,power_law_1.2,0.07111679911613464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,32,power_law_1.01,0.06212480068206787
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,32,power_law_1.2,0.08353919982910156
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,16,balanced,0.0262773334980011
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,32,power_law_1.2,0.09736319780349731
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,32,power_law_1.01,0.06998400092124939
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,32,power_law_1.2,0.1481152057647705
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,32,balanced,0.2560373346010844
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,16,balanced,0.02731200059254964
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,32,power_law_1.01,0.07837439775466919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,32,power_law_1.2,0.17633919715881347
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,16,balanced,0.026933332284291584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,32,power_law_1.2,0.2558655977249146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,32,power_law_1.01,0.09377920031547546
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,32,power_law_1.2,0.3091007947921753
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,16,balanced,0.03073599934577942
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,32,power_law_1.01,0.1317055940628052
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,32,power_law_1.2,0.4661248207092285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,16,balanced,0.031898667414983116
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,32,power_law_1.01,0.15381759405136108
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,32,power_law_1.2,0.6010176181793213
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,32,balanced,0.33051733175913495
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,16,balanced,0.03342933456103007
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,32,power_law_1.2,0.7480576038360596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,32,power_law_1.01,0.22546560764312745
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,16,balanced,0.038848000268141426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,32,power_law_1.2,1.1767104148864747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,32,power_law_1.01,0.2905280113220215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,16,balanced,0.03870933254559835
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,32,power_law_1.2,2.2844287872314455
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,32,power_law_1.01,0.4581183910369873
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,16,balanced,0.03897066662708918
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,32,power_law_1.01,0.5649151802062988
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,32,balanced,0.4086506764094035
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,16,balanced,0.03885866701602936
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,32,power_law_1.01,0.7229375839233398
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,16,balanced,0.03959999978542328
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,16,balanced,0.03859733293453852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,32,power_law_1.01,1.1571264266967773
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,16,balanced,0.040421334405740104
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,32,power_law_1.01,2.319046401977539
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,16,balanced,0.04091733445723852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,16,balanced,0.04293333490689596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,16,balanced,0.046682665745417275
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,32,balanced,0.6389973163604736
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,16,balanced,0.04855999847253164
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,16,balanced,0.05764266848564148
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,16,power_law_1.01,0.026060798764228822
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,16,balanced,0.06039999922116598
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,16,power_law_1.01,0.027110400795936584
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,16,balanced,0.0681386689345042
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,16,power_law_1.01,0.027500799298286437
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,16,balanced,0.07893866797288258
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,16,power_law_1.01,0.029734399914741517
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,16,power_law_1.01,0.031174400448799135
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,16,balanced,0.10150399804115295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,16,power_law_1.2,0.025996801257133485
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,16,power_law_1.01,0.03298560082912445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,16,balanced,0.11972799897193909
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,16,power_law_1.2,0.027059200406074523
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,16,power_law_1.01,0.03800320029258728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,16,power_law_1.2,0.027136000990867614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,16,power_law_1.01,0.03844479918479919
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,16,balanced,0.1590026617050171
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,16,power_law_1.2,0.030054399371147157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,16,power_law_1.01,0.03935360014438629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,32,balanced,1.259669303894043
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,16,power_law_1.01,0.03856000006198883
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,16,power_law_1.2,0.030943998694419862
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,16,power_law_1.01,0.03850879967212677
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,16,power_law_1.2,0.03301759958267212
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,16,balanced,0.1946986714998881
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,16,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,16,power_law_1.01,0.03961600065231323
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,8,balanced,0.025754667818546295
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,16,power_law_1.01,0.03985919952392578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,16,power_law_1.2,0.03811840116977692
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,16,power_law_1.01,0.04110080003738403
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,16,balanced,0.26733332872390747
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,8,balanced,0.026554666459560394
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,16,power_law_1.2,0.03861120045185089
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,8,balanced,0.02681066592534383
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,16,power_law_1.01,0.043315199017524716
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,16,power_law_1.2,0.03909760117530823
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,8,balanced,0.030762667457262676
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,16,power_law_1.01,0.04700160026550293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,16,power_law_1.2,0.038899201154708865
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,8,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,16,power_law_1.01,0.04999679923057556
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,16,power_law_1.2,0.03953920006752014
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,16,balanced,0.3474453290303548
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,8,balanced,0.03200533241033554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,16,power_law_1.01,0.06223999857902527
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,16,power_law_1.2,0.04072319865226746
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,8,balanced,0.034074666599432625
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,16,power_law_1.2,0.04108160138130188
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,16,power_law_1.01,0.06733440160751343
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,8,balanced,0.03440533330043157
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,16,power_law_1.01,0.07995520234107971
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,16,power_law_1.2,0.043782401084899905
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,8,balanced,0.037402667105197906
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,16,power_law_1.01,0.09380480051040649
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,8,balanced,0.03756800045569738
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,16,power_law_1.2,0.04702079892158508
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,16,balanced,0.43795732657114667
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,16,power_law_1.01,0.13771519660949708
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,8,balanced,0.03811199963092804
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,16,power_law_1.2,0.050291198492050174
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,16,power_law_1.01,0.15644799470901488
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,8,balanced,0.03783999880154928
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,16,power_law_1.2,0.06382079720497132
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,8,balanced,0.03879466652870178
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,16,power_law_1.01,0.24844160079956054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,16,power_law_1.2,0.069651198387146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,8,balanced,0.0391146664818128
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,16,power_law_1.01,0.30881919860839846
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,16,power_law_1.2,0.08617600202560424
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,8,balanced,0.03972800076007843
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,16,power_law_1.01,0.4401279926300049
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,16,power_law_1.2,0.10355199575424194
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,8,balanced,0.04091733445723852
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,16,power_law_1.2,0.1630079984664917
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,16,power_law_1.01,0.593721580505371
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,8,balanced,0.04293333490689596
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,16,balanced,0.67412797609965
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,16,power_law_1.2,0.1944383978843689
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,16,power_law_1.01,0.7649856090545655
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,8,balanced,0.050293331344922386
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,16,power_law_1.2,0.28573439121246336
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,16,power_law_1.01,1.0718400001525878
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,16,power_law_1.2,0.3353600025177002
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,8,balanced,0.054976001381874084
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,16,power_law_1.01,2.211673545837402
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,16,power_law_1.2,0.4915584087371826
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,8,balanced,0.07123200098673503
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,16,power_law_1.2,0.6975168228149414
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,8,balanced,0.08303999900817871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,16,power_law_1.2,0.8617088317871093
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,8,balanced,0.10514666636784871
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,16,power_law_1.2,1.5128064155578613
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,16,power_law_1.2,2.736390495300293
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,8,balanced,0.1246560017267863
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,8,power_law_1.01,0.02531839907169342
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,8,balanced,0.16529066363970438
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,8,power_law_1.01,0.026310399174690247
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,8,power_law_1.01,0.026822400093078614
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,16,balanced,1.3216426372528076
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,8,balanced,0.20349333683649698
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,8,power_law_1.01,0.02953599989414215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,8,power_law_1.01,0.029875200986862183
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,8,power_law_1.2,0.025337600708007814
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,8,power_law_1.01,0.03130879998207092
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,8,balanced,0.28091200192769367
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,8,power_law_1.2,0.026335999369621277
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,8,power_law_1.01,0.03324800133705139
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,8,power_law_1.2,0.026412799954414368
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,8,power_law_1.2,0.02927359938621521
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,8,power_law_1.01,0.03330560028553009
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,8,power_law_1.2,0.02990719974040985
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,8,power_law_1.2,0.03126400113105774
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,8,power_law_1.01,0.03829120099544525
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,8,power_law_1.2,0.033055999875068666
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,8,balanced,0.3622613350550334
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,8,power_law_1.01,0.037920001149177554
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,8,power_law_1.2,0.0335999995470047
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,8,power_law_1.2,0.037785598635673524
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,8,power_law_1.01,0.037427198886871335
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,8,power_law_1.2,0.03800320029258728
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,8,power_law_1.2,0.03842560052871704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,8,power_law_1.01,0.038649600744247434
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,8,power_law_1.2,0.03808639943599701
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,8,power_law_1.01,0.03912320137023926
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,8,power_law_1.2,0.038675200939178464
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,8,balanced,0.4585173527399699
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,8,power_law_1.2,0.041254401206970215
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,8,power_law_1.01,0.03969280123710632
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,8,power_law_1.2,0.04076800048351288
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,8,power_law_1.2,0.044352000951766966
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,8,power_law_1.01,0.04110719859600067
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,8,power_law_1.2,0.047014400362968445
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,8,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,8,power_law_1.2,0.0581055998802185
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,8,power_law_1.01,0.04677119851112366
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,8,power_law_1.2,0.06833279728889466
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,8,power_law_1.2,0.08681600093841553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,8,power_law_1.01,0.056460797786712646
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,8,power_law_1.2,0.09768319725990296
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,8,balanced,0.7005440394083658
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,8,power_law_1.01,0.06291199922561645
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,8,power_law_1.2,0.12735999822616578
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,8,power_law_1.2,0.1592960000038147
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,8,power_law_1.01,0.08217599987983704
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,8,power_law_1.2,0.2587455987930298
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,8,power_law_1.2,0.33702399730682375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,8,power_law_1.01,0.0942911982536316
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,8,power_law_1.2,0.4970047950744629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,8,power_law_1.01,0.11960320472717285
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,8,power_law_1.2,0.6266367912292481
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,8,power_law_1.01,0.15438079833984375
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,8,power_law_1.2,0.7365952014923096
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,8,power_law_1.01,0.21203839778900146
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,8,power_law_1.2,1.2608320236206054
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,8,power_law_1.01,0.2764607906341553
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,8,power_law_1.2,2.3371135711669924
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,8,power_law_1.01,0.41948161125183103
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,8,power_law_1.01,0.49743361473083497
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,8,power_law_1.01,0.651417589187622
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,8,power_law_1.01,0.9963456153869629
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,8,balanced,1.3732266426086426
TRTLLM,1.2.0rc5,NVIDIA H200,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,8,power_law_1.01,1.8757183074951171
